diff --git a/.coveragerc b/.coveragerc index 5b264a626abfa..3f630aa6cf8f5 100644 --- a/.coveragerc +++ b/.coveragerc @@ -1,6 +1,7 @@ # .coveragerc to control coverage.py [run] branch = False +omit = */tests/* [report] # Regexes for lines to exclude from consideration @@ -23,4 +24,4 @@ exclude_lines = ignore_errors = False [html] -directory = coverage_html_report \ No newline at end of file +directory = coverage_html_report diff --git a/.github/CODE_OF_CONDUCT.md b/.github/CODE_OF_CONDUCT.md new file mode 100644 index 0000000000000..a1fbece3284ec --- /dev/null +++ b/.github/CODE_OF_CONDUCT.md @@ -0,0 +1,63 @@ +# Contributor Code of Conduct + +As contributors and maintainers of this project, and in the interest of +fostering an open and welcoming community, we pledge to respect all people who +contribute through reporting issues, posting feature requests, updating +documentation, submitting pull requests or patches, and other activities. + +We are committed to making participation in this project a harassment-free +experience for everyone, regardless of level of experience, gender, gender +identity and expression, sexual orientation, disability, personal appearance, +body size, race, ethnicity, age, religion, or nationality. + +Examples of unacceptable behavior by participants include: + +* The use of sexualized language or imagery +* Personal attacks +* Trolling or insulting/derogatory comments +* Public or private harassment +* Publishing other's private information, such as physical or electronic + addresses, without explicit permission +* Other unethical or unprofessional conduct + +Project maintainers have the right and responsibility to remove, edit, or +reject comments, commits, code, wiki edits, issues, and other contributions +that are not aligned to this Code of Conduct, or to ban temporarily or +permanently any contributor for other behaviors that they deem inappropriate, +threatening, offensive, or harmful. + +By adopting this Code of Conduct, project maintainers commit themselves to +fairly and consistently applying these principles to every aspect of managing +this project. Project maintainers who do not follow or enforce the Code of +Conduct may be permanently removed from the project team. + +This Code of Conduct applies both within project spaces and in public spaces +when an individual is representing the project or its community. + +A working group of community members is committed to promptly addressing any +reported issues. The working group is made up of pandas contributors and users. +Instances of abusive, harassing, or otherwise unacceptable behavior may be +reported by contacting the working group by e-mail (pandas-coc@googlegroups.com). +Messages sent to this e-mail address will not be publicly visible but only to +the working group members. The working group currently includes + +- Safia Abdalla +- Tom Augspurger +- Joris Van den Bossche +- Camille Scott +- Nathaniel Smith + +All complaints will be reviewed and investigated and will result in a response +that is deemed necessary and appropriate to the circumstances. Maintainers are +obligated to maintain confidentiality with regard to the reporter of an +incident. + +This Code of Conduct is adapted from the [Contributor Covenant][homepage], +version 1.3.0, available at +[http://contributor-covenant.org/version/1/3/0/][version], +and the [Swift Code of Conduct][swift]. 
+
+[homepage]: http://contributor-covenant.org
+[version]: http://contributor-covenant.org/version/1/3/0/
+[swift]: https://swift.org/community/#code-of-conduct
+
diff --git a/.github/CONTRIBUTING.md b/.github/CONTRIBUTING.md
new file mode 100644
index 0000000000000..95729f845ff5c
--- /dev/null
+++ b/.github/CONTRIBUTING.md
@@ -0,0 +1,24 @@
+Contributing to pandas
+======================
+
+Whether you are a novice or experienced software developer, all contributions and suggestions are welcome!
+
+Our main contribution docs can be found [here](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst), but if you do not want to read them in their entirety, we will summarize the main ways in which you can contribute and point to relevant places in the docs for further information.
+
+Getting Started
+---------------
+If you are looking to contribute to the *pandas* codebase, the best place to start is the [GitHub "issues" tab](https://github.com/pandas-dev/pandas/issues). This is also a great place for filing bug reports and making suggestions for ways in which we can improve the code and documentation.
+
+If you have additional questions, feel free to ask them on the [mailing list](https://groups.google.com/forum/?fromgroups#!forum/pydata) or on [Gitter](https://gitter.im/pydata/pandas). Further information can also be found in the [Getting Started](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#where-to-start) section of our main contribution docs.
+
+Filing Issues
+-------------
+If you notice a bug in the code or in the docs, or have suggestions for how we can improve either, feel free to create an issue on the [GitHub "issues" tab](https://github.com/pandas-dev/pandas/issues) using [GitHub's "issue" form](https://github.com/pandas-dev/pandas/issues/new). The form contains some questions that will help us best address your issue. For more information regarding how to file issues against *pandas*, please refer to the [Bug reports and enhancement requests](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#bug-reports-and-enhancement-requests) section of our main contribution docs.
+
+Contributing to the Codebase
+----------------------------
+The code is hosted on [GitHub](https://www.github.com/pandas-dev/pandas), so you will need to use [Git](http://git-scm.com/) to clone the project and make changes to the codebase. Once you have obtained a copy of the code, you should create a development environment that is separate from your existing Python environment so that you can make and test changes without compromising your own work environment. For more information, please refer to the [Working with the code](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#working-with-the-code) section of our main contribution docs.
+
+Before submitting your changes for review, make sure to check that your changes do not break any tests; a minimal smoke test is sketched at the end of this section. More information about our test suites can be found [here](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#test-driven-development-code-writing). We also have guidelines regarding coding style that will be enforced during testing. Details about coding style can be found [here](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#code-standards).
+
+Once your changes are ready to be submitted, make sure to push your changes to GitHub before creating a pull request. Details about how to do that can be found in the [Contributing your changes to pandas](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#contributing-your-changes-to-pandas) section of our main contribution docs. We will review your changes, and you will most likely be asked to make additional changes before your pull request is ready to merge. However, once it is ready, we will merge it, and you will have successfully contributed to the codebase!
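To make the test check above concrete, a minimal smoke test of a development build might look like the following sketch (the DataFrame and the assertion are invented for illustration; the linked docs describe the real test suites and runners):

```python
import pandas as pd

# Smoke test: the development build imports and basic operations work.
print(pd.__version__)  # should report your development version

df = pd.DataFrame({"x": [1, 2, 3]})
assert df["x"].sum() == 6  # trivial end-to-end sanity check
```

This is only a quick sanity check; run the relevant test modules before opening a pull request.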
diff --git a/.github/ISSUE_TEMPLATE.md b/.github/ISSUE_TEMPLATE.md
new file mode 100644
index 0000000000000..e33835c462511
--- /dev/null
+++ b/.github/ISSUE_TEMPLATE.md
@@ -0,0 +1,29 @@
+#### Code Sample, a copy-pastable example if possible
+
+```python
+# Your code here
+
+```
+#### Problem description
+
+[this should explain **why** the current behaviour is a problem and why the expected output is a better solution.]
+
+**Note**: We receive a lot of issues on our GitHub tracker, so it is very possible that your issue has been posted before. Please check first before submitting so that we do not have to handle and close duplicates!
+
+**Note**: Many problems can be resolved by simply upgrading `pandas` to the latest version. Before submitting, please check if that solution works for you. If possible, you may want to check if `master` addresses this issue, but that is not necessary.
+
+For documentation-related issues, you can check the latest versions of the docs on `master` here:
+
+https://pandas-docs.github.io/pandas-docs-travis/
+
+If the issue has not been resolved there, go ahead and file it in the issue tracker.
+
+#### Expected Output
+
+#### Output of ``pd.show_versions()``
+
+<details>
+
+[paste the output of ``pd.show_versions()`` here below this line]
+
+</details>
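For illustration, a filled-in report based on the template above might look like the following hypothetical example (the data and the observed behaviour are invented):

```python
import pandas as pd

# Short, self-contained snippet that reproduces the (hypothetical) problem
df = pd.DataFrame({"a": [1, 2, None]})
print(df["a"].sum())  # paste the actual output you observe here

# Version information for the "Output of pd.show_versions()" section
pd.show_versions()
```

A report in this shape lets maintainers reproduce the issue without guessing at the input data or the environment.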
diff --git a/.github/PULL_REQUEST_TEMPLATE.md b/.github/PULL_REQUEST_TEMPLATE.md new file mode 100644 index 0000000000000..4e1e9ce017408 --- /dev/null +++ b/.github/PULL_REQUEST_TEMPLATE.md @@ -0,0 +1,4 @@ +- [ ] closes #xxxx +- [ ] tests added / passed +- [ ] passes `git diff upstream/master -u -- "*.py" | flake8 --diff` +- [ ] whatsnew entry diff --git a/.gitignore b/.gitignore index d33df2df6e548..96b1f945870de 100644 --- a/.gitignore +++ b/.gitignore @@ -7,6 +7,7 @@ *$ *.bak *flymake* +*.iml *.kdev4 *.log *.swp @@ -18,6 +19,9 @@ .vagrant .noseids .ipynb_checkpoints +.tags +.cache/ +.vscode/ # Compiled source # ################### @@ -26,6 +30,7 @@ *.class *.dll *.exe +*.pxi *.o *.py[ocd] *.so @@ -43,6 +48,7 @@ dist # Egg metadata *.egg-info .eggs +.pypirc # tox testing tool .tox @@ -53,6 +59,9 @@ dist **/wheelhouse/* # coverage .coverage +coverage.xml +coverage_html_report +*.pytest_cache # OS generated files # ###################### @@ -66,6 +75,7 @@ Thumbs.db # Data files # ############## *.dta +*.xpt *.h5 pandas/io/*.dat pandas/io/*.json @@ -79,9 +89,12 @@ scikits *.c *.cpp -# Performance Testing # -####################### -asv_bench/ +# Unit / Performance Testing # +############################## +asv_bench/env/ +asv_bench/html/ +asv_bench/results/ +asv_bench/pandas/ # Documentation generated files # ################################# @@ -93,3 +106,7 @@ doc/source/index.rst doc/build/html/index.html # Windows specific leftover: doc/tmp.sv +doc/source/styled.xlsx +doc/source/templates/ +env/ +doc/source/savefig/ diff --git a/.pep8speaks.yml b/.pep8speaks.yml new file mode 100644 index 0000000000000..fda26d87bf7f6 --- /dev/null +++ b/.pep8speaks.yml @@ -0,0 +1,12 @@ +# File : .pep8speaks.yml + +scanner: + diff_only: True # If True, errors caused by only the patch are shown + +pycodestyle: + max-line-length: 79 + ignore: # Errors and warnings to ignore + - E402, # module level import not at top of file + - E731, # do not assign a lambda expression, use a def + - E741, # do not use variables named 'l', 'O', or 'I' + - W503 # line break before binary operator diff --git a/.travis.yml b/.travis.yml index 4e46fb7ad85ca..2d2a0bc019c80 100644 --- a/.travis.yml +++ b/.travis.yml @@ -1,190 +1,138 @@ - +sudo: false language: python +# Default Python version is usually 2.7 +python: 3.5 -env: +# To turn off cached cython files and compiler cache +# set NOCACHE-true +# To delete caches go to https://travis-ci.org/OWNER/REPOSITORY/caches or run +# travis cache --delete inside the project directory from the travis command line client +# The cache directories will be deleted if anything in ci/ changes in a commit +cache: + ccache: true + directories: + - $HOME/.cache # cython cache + - $HOME/.ccache # compiler cache +env: global: - # scatterci API key - #- secure: "Bx5umgo6WjuGY+5XFa004xjCiX/vq0CyMZ/ETzcs7EIBI1BE/0fIDXOoWhoxbY9HPfdPGlDnDgB9nGqr5wArO2s+BavyKBWg6osZ3dmkfuJPMOWeyCa92EeP+sfKw8e5HSU5MizW9e319wHWOF/xkzdHR7T67Qd5erhv91x4DnQ=" - # ironcache API key - - secure: "e4eEFn9nDQc3Xa5BWYkzfX37jaWVq89XidVX+rcCNEr5OlOImvveeXnF1IzbRXznH4Sv0YsLwUd8RGUWOmyCvkONq/VJeqCHWtTMyfaCIdqSyhIP9Odz8r9ahch+Y0XFepBey92AJHmlnTh+2GjCDgIiqq4fzglojnp56Vg1ojA=" - - secure: "CjmYmY5qEu3KrvMtel6zWFEtMq8ORBeS1S1odJHnjQpbwT1KY2YFZRVlLphfyDQXSz6svKUdeRrCNp65baBzs3DQNA8lIuXGIBYFeJxqVGtYAZZs6+TzBPfJJK798sGOj5RshrOJkFG2rdlWNuTq/XphI0JOrN3nPUkRrdQRpAw=" - # pandas-docs-bot GH - - secure: 
"PCzUFR8CHmw9lH84p4ygnojdF7Z8U5h7YfY0RyT+5K/aiQ1ZTU3ZkDTPI0/rR5FVMxsEEKEQKMcc5fvqW0PeD7Q2wRmluloKgT9w4EVEJ1ppKf7lITPcvZR2QgVOvjv4AfDtibLHFNiaSjzoqyJVjM4igjOu8WTlF3JfZcmOQjQ=" + # create a github personal access token + # cd pandas-dev/pandas + # travis encrypt 'PANDAS_GH_TOKEN=personal_access_token' -r pandas-dev/pandas + - secure: "EkWLZhbrp/mXJOx38CHjs7BnjXafsqHtwxPQrqWy457VDFWhIY1DMnIR/lOWG+a20Qv52sCsFtiZEmMfUjf0pLGXOqurdxbYBGJ7/ikFLk9yV2rDwiArUlVM9bWFnFxHvdz9zewBH55WurrY4ShZWyV+x2dWjjceWG5VpWeI6sA=" git: # for cloning - depth: 100 + depth: 1000 matrix: fast_finish: true + exclude: + # Exclude the default Python 3.5 build + - python: 3.5 include: - - python: 2.6 - env: - - JOB_NAME: "26_nslow_nnet" - - NOSE_ARGS="not slow and not network and not disabled" - - CLIPBOARD=xclip - - LOCALE_OVERRIDE="it_IT.UTF-8" - - BUILD_TYPE=conda - - INSTALL_TEST=true - - python: 2.7 - env: - - JOB_NAME: "27_slow_nnet_LOCALE" - - NOSE_ARGS="slow and not network and not disabled" - - LOCALE_OVERRIDE="zh_CN.GB18030" - - FULL_DEPS=true - - JOB_TAG=_LOCALE - - BUILD_TYPE=conda - - python: 2.7 - env: - - JOB_NAME: "27_nslow" - - NOSE_ARGS="not slow and not disabled" - - FULL_DEPS=true - - CLIPBOARD_GUI=gtk2 - - BUILD_TYPE=conda - - DOC_BUILD=true # if rst files were changed, build docs in parallel with tests - - python: 3.4 + - os: osx + language: generic env: - - JOB_NAME: "34_nslow" - - NOSE_ARGS="not slow and not disabled" - - FULL_DEPS=true - - CLIPBOARD=xsel - - BUILD_TYPE=conda - - python: 3.5 + - JOB="3.5, OSX" ENV_FILE="ci/travis-35-osx.yaml" TEST_ARGS="--skip-slow --skip-network" + + - dist: trusty env: - - JOB_NAME: "35_nslow" - - NOSE_ARGS="not slow and not network and not disabled" - - FULL_DEPS=true - - CLIPBOARD=xsel - - BUILD_TYPE=conda - - python: 3.3 + - JOB="3.7" ENV_FILE="ci/travis-37.yaml" TEST_ARGS="--skip-slow --skip-network" + + - dist: trusty env: - - JOB_NAME: "33_nslow" - - NOSE_ARGS="not slow and not disabled" - - FULL_DEPS=true - - CLIPBOARD=xsel - - BUILD_TYPE=conda - - python: 2.7 + - JOB="2.7, locale, slow, old NumPy" ENV_FILE="ci/travis-27-locale.yaml" LOCALE_OVERRIDE="zh_CN.UTF-8" SLOW=true + addons: + apt: + packages: + - language-pack-zh-hans + - dist: trusty env: - - JOB_NAME: "27_slow" - - JOB_TAG=_SLOW - - NOSE_ARGS="slow and not network and not disabled" - - FULL_DEPS=true - - BUILD_TYPE=conda - - python: 3.4 + - JOB="2.7, lint" ENV_FILE="ci/travis-27.yaml" TEST_ARGS="--skip-slow" LINT=true + addons: + apt: + packages: + - python-gtk2 + - dist: trusty env: - - JOB_NAME: "34_slow" - - JOB_TAG=_SLOW - - NOSE_ARGS="slow and not network and not disabled" - - FULL_DEPS=true - - CLIPBOARD=xsel - - BUILD_TYPE=conda - - python: 2.7 + - JOB="3.6, coverage" ENV_FILE="ci/travis-36.yaml" TEST_ARGS="--skip-slow --skip-network" PANDAS_TESTING_MODE="deprecate" COVERAGE=true + # In allow_failures + - dist: trusty env: - - JOB_NAME: "27_build_test_conda" - - JOB_TAG=_BUILD_TEST - - NOSE_ARGS="not slow and not disabled" - - FULL_DEPS=true - - BUILD_TYPE=conda - - BUILD_TEST=true - - python: 2.7 + - JOB="3.6, slow" ENV_FILE="ci/travis-36-slow.yaml" SLOW=true + # In allow_failures + - dist: trusty env: - - JOB_NAME: "27_build_test_pydata" - - JOB_TAG=_BUILD_TEST - - NOSE_ARGS="not slow and not disabled" - - FULL_DEPS=true - - BUILD_TYPE=pydata - - BUILD_TEST=true - - python: 2.7 + - JOB="3.6, NumPy dev" ENV_FILE="ci/travis-36-numpydev.yaml" TEST_ARGS="--skip-slow --skip-network" PANDAS_TESTING_MODE="deprecate" + addons: + apt: + packages: + - xsel + # In allow_failures + - dist: trusty env: 
- - JOB_NAME: "27_numpy_master" - - JOB_TAG=_NUMPY_DEV_master - - NOSE_ARGS="not slow and not network and not disabled" - - NUMPY_BUILD=master - - BUILD_TYPE=pydata - - PANDAS_TESTING_MODE="deprecate" + - JOB="3.6, doc" ENV_FILE="ci/travis-36-doc.yaml" DOC=true allow_failures: - - python: 3.3 - env: - - JOB_NAME: "33_nslow" - - NOSE_ARGS="not slow and not disabled" - - FULL_DEPS=true - - CLIPBOARD=xsel - - BUILD_TYPE=conda - - python: 2.7 + - dist: trusty env: - - JOB_NAME: "27_slow" - - JOB_TAG=_SLOW - - NOSE_ARGS="slow and not network and not disabled" - - FULL_DEPS=true - - BUILD_TYPE=conda - - python: 3.4 + - JOB="3.6, slow" ENV_FILE="ci/travis-36-slow.yaml" SLOW=true + - dist: trusty env: - - JOB_NAME: "34_slow" - - JOB_TAG=_SLOW - - NOSE_ARGS="slow and not network and not disabled" - - FULL_DEPS=true - - CLIPBOARD=xsel - - BUILD_TYPE=conda - - python: 2.7 + - JOB="3.6, NumPy dev" ENV_FILE="ci/travis-36-numpydev.yaml" TEST_ARGS="--skip-slow --skip-network" PANDAS_TESTING_MODE="deprecate" + addons: + apt: + packages: + - xsel + - dist: trusty env: - - JOB_NAME: "27_numpy_master" - - JOB_TAG=_NUMPY_DEV_master - - NOSE_ARGS="not slow and not network and not disabled" - - NUMPY_BUILD=master - - BUILD_TYPE=pydata - - PANDAS_TESTING_MODE="deprecate" - - python: 2.7 - env: - - JOB_NAME: "27_build_test_conda" - - JOB_TAG=_BUILD_TEST - - NOSE_ARGS="not slow and not disabled" - - FULL_DEPS=true - - BUILD_TYPE=conda - - BUILD_TEST=true - - python: 2.7 - env: - - JOB_NAME: "27_build_test_pydata" - - JOB_TAG=_BUILD_TEST - - NOSE_ARGS="not slow and not disabled" - - FULL_DEPS=true - - BUILD_TYPE=pydata - - BUILD_TEST=true + - JOB="3.6, doc" ENV_FILE="ci/travis-36-doc.yaml" DOC=true before_install: - echo "before_install" - - echo $VIRTUAL_ENV - - export PATH="$HOME/miniconda/bin:$PATH" - - sudo apt-get install ccache + # set non-blocking IO on travis + # https://github.com/travis-ci/travis-ci/issues/8920#issuecomment-352661024 + - python -c 'import os,sys,fcntl; flags = fcntl.fcntl(sys.stdout, fcntl.F_GETFL); fcntl.fcntl(sys.stdout, fcntl.F_SETFL, flags&~os.O_NONBLOCK);' + - source ci/travis_process_gbq_encryption.sh + - export PATH="$HOME/miniconda3/bin:$PATH" - df -h - - date - pwd - uname -a - - python -V - - ci/before_install.sh - # Xvfb stuff for clipboard functionality; see the travis-ci documentation - - export DISPLAY=:99.0 - - sh -e /etc/init.d/xvfb start + - git --version + - git tag install: - - echo "install" - - ci/prep_ccache.sh - - ci/install_${BUILD_TYPE}.sh - - ci/submit_ccache.sh + - echo "install start" + - ci/prep_cython_cache.sh + - ci/install_travis.sh + - ci/submit_cython_cache.sh + - echo "install done" before_script: - - mysql -e 'create database pandas_nosetest;' - - psql -c 'create database pandas_nosetest;' -U postgres + - ci/install_db_travis.sh + - export DISPLAY=":99.0" + - ci/before_script_travis.sh script: - - echo "script" - - ci/run_build_docs.sh & - - ci/script.sh -# nothing here, or failed tests won't fail travis + - echo "script start" + - ci/run_build_docs.sh + - ci/script_single.sh + - ci/script_multi.sh + - ci/lint.sh + - echo "checking imports" + - source activate pandas && python ci/check_imports.py + - echo "script done" + +after_success: + - ci/upload_coverage.sh after_script: - - ci/install_test.sh - - if [ -f /tmp/doc.log ]; then cat /tmp/doc.log; fi - - source activate pandas && ci/print_versions.py - - ci/print_skipped.py /tmp/nosetests.xml - - ci/after_script.sh + - echo "after_script start" + - source activate pandas && pushd /tmp && python -c 
"import pandas; pandas.show_versions();" && popd + - if [ -e /tmp/single.xml ]; then + ci/print_skipped.py /tmp/single.xml; + fi + - if [ -e /tmp/multiple.xml ]; then + ci/print_skipped.py /tmp/multiple.xml; + fi + - echo "after_script done" diff --git a/AUTHORS.md b/AUTHORS.md new file mode 100644 index 0000000000000..dcaaea101f4c8 --- /dev/null +++ b/AUTHORS.md @@ -0,0 +1,57 @@ +About the Copyright Holders +=========================== + +* Copyright (c) 2008-2011 AQR Capital Management, LLC + + AQR Capital Management began pandas development in 2008. Development was + led by Wes McKinney. AQR released the source under this license in 2009. +* Copyright (c) 2011-2012, Lambda Foundry, Inc. + + Wes is now an employee of Lambda Foundry, and remains the pandas project + lead. +* Copyright (c) 2011-2012, PyData Development Team + + The PyData Development Team is the collection of developers of the PyData + project. This includes all of the PyData sub-projects, including pandas. The + core team that coordinates development on GitHub can be found here: + http://github.com/pydata. + +Full credits for pandas contributors can be found in the documentation. + +Our Copyright Policy +==================== + +PyData uses a shared copyright model. Each contributor maintains copyright +over their contributions to PyData. However, it is important to note that +these contributions are typically only changes to the repositories. Thus, +the PyData source code, in its entirety, is not the copyright of any single +person or institution. Instead, it is the collective copyright of the +entire PyData Development Team. If individual contributors want to maintain +a record of what changes/contributions they have specific copyright on, +they should indicate their copyright in the commit message of the change +when they commit the change to one of the PyData repositories. + +With this in mind, the following banner should be used in any source code +file to indicate the copyright and license terms: + +``` +#----------------------------------------------------------------------------- +# Copyright (c) 2012, PyData Development Team +# All rights reserved. +# +# Distributed under the terms of the BSD Simplified License. +# +# The full license is in the LICENSE file, distributed with this software. +#----------------------------------------------------------------------------- +``` + +Other licenses can be found in the LICENSES directory. + +License +======= + +pandas is distributed under a 3-clause ("Simplified" or "New") BSD +license. Parts of NumPy, SciPy, numpydoc, bottleneck, which all have +BSD-compatible licenses, are included. Their licenses follow the pandas +license. + diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md deleted file mode 100644 index 284ac2fc5b169..0000000000000 --- a/CONTRIBUTING.md +++ /dev/null @@ -1,640 +0,0 @@ -Contributing to pandas -====================== - -Where to start? ---------------- - -All contributions, bug reports, bug fixes, documentation improvements, -enhancements and ideas are welcome. - -If you are simply looking to start working with the *pandas* codebase, -navigate to the [GitHub "issues" -tab](https://github.com/pydata/pandas/issues) and start looking through -interesting issues. There are a number of issues listed under -[Docs](https://github.com/pydata/pandas/issues?labels=Docs&sort=updated&state=open) -and [Difficulty -Novice](https://github.com/pydata/pandas/issues?q=is%3Aopen+is%3Aissue+label%3A%22Difficulty+Novice%22) -where you could start out. 
-
-Or maybe through using *pandas* you have an idea of your own or are
-looking for something in the documentation and thinking 'this can be
-improved'... you can do something about it!
-
-Feel free to ask questions on the [mailing
-list](https://groups.google.com/forum/?fromgroups#!forum/pydata)
-
-Bug Reports/Enhancement Requests
---------------------------------
-
-Bug reports are an important part of making *pandas* more stable. Having
-a complete bug report will allow others to reproduce the bug and provide
-insight into fixing it. Since many versions of *pandas* are supported,
-knowing version information will also identify improvements made since
-previous versions. Often trying the bug-producing code out on the
-*master* branch is a worthwhile exercise to confirm the bug still
-exists. It is also worth searching existing bug reports and pull
-requests to see if the issue has already been reported and/or fixed.
-
-Bug reports must:
-
-1. Include a short, self-contained Python snippet reproducing the
-   problem. You can have the code formatted nicely by using [GitHub
-   Flavored
-   Markdown](http://github.github.com/github-flavored-markdown/):
-
-   ```python
-   >>> from pandas import DataFrame
-   >>> df = DataFrame(...)
-   ...
-   ```
-
-2. Include the full version string of *pandas* and its dependencies. In
-   recent (>0.12) versions of *pandas* you can use a built-in
-   function:
-
-       >>> from pandas.util.print_versions import show_versions
-       >>> show_versions()
-
-   and from 0.13.1 onwards:
-
-       >>> pd.show_versions()
-
-3. Explain why the current behavior is wrong/not desired and what you
-   expect instead.
-
-The issue will then show up to the *pandas* community and be open to
-comments/ideas from others.
-
-Working with the code
----------------------
-
-Now that you have an issue you want to fix, an enhancement to add, or
-documentation to improve, you need to learn how to work with GitHub and
-the *pandas* code base.
-
-### Version Control, Git, and GitHub
-
-To the new user, working with Git is one of the more daunting aspects of
-contributing to *pandas*. It can very quickly become overwhelming, but
-sticking to the guidelines below will make the process straightforward
-and will work without much trouble. As always, if you are having
-difficulties please feel free to ask for help.
-
-The code is hosted on [GitHub](https://www.github.com/pydata/pandas). To
-contribute you will need to sign up for a [free GitHub
-account](https://github.com/signup/free). We use
-[Git](http://git-scm.com/) for version control to allow many people to
-work together on the project.
-
-Some great resources for learning Git:
-
-- the [GitHub help pages](http://help.github.com/).
-- [NumPy's
-  documentation](http://docs.scipy.org/doc/numpy/dev/index.html).
-- Matthew Brett's
-  [Pydagogue](http://matthew-brett.github.com/pydagogue/).
-
-### Getting Started with Git
-
-[GitHub has instructions](http://help.github.com/set-up-git-redirect)
-for installing git, setting up your SSH key, and configuring git. All
-these steps need to be completed before working seamlessly with your
-local repository and GitHub.
-
-### Forking
-
-You will need your own fork to work on the code. Go to the [pandas
-project page](https://github.com/pydata/pandas) and hit the *fork*
-button.
You will want to clone your fork to your machine:
-
-    git clone git@github.com:your-user-name/pandas.git pandas-yourname
-    cd pandas-yourname
-    git remote add upstream git://github.com/pydata/pandas.git
-
-This creates the directory pandas-yourname and connects your repository
-to the upstream (main project) *pandas* repository.
-
-You will also need to hook up Travis-CI to your GitHub repository so the
-suite is automatically run when a Pull Request is submitted.
-Instructions are
-[here](http://about.travis-ci.org/docs/user/getting-started/).
-
-### Creating a Branch
-
-You want your master branch to reflect only production-ready code, so
-create a feature branch for making your changes. For example:
-
-    git branch shiny-new-feature
-    git checkout shiny-new-feature
-
-The above can be simplified to:
-
-    git checkout -b shiny-new-feature
-
-This changes your working directory to the shiny-new-feature branch.
-Keep any changes in this branch specific to one bug or feature so it is
-clear what the branch brings to *pandas*. You can have many
-shiny-new-features and switch between them using the git checkout
-command.
-
-### Creating a Development Environment
-
-An easy way to create a *pandas* development environment is as follows.
-
-- Install either Anaconda or miniconda
-- Make sure that you have cloned the repository
-- `cd` to the pandas source directory
-
-Tell `conda` to create a new environment, named `pandas_dev`, or any
-name you would like for this environment, by running:
-
-    conda create -n pandas_dev --file ci/requirements_dev.txt
-
-For a Python 3 environment:
-
-    conda create -n pandas_dev python=3 --file ci/requirements_dev.txt
-
-If you are on `windows`, then you will need to install the compiler
-linkages:
-
-    conda install -n pandas_dev libpython
-
-This will create the new environment, and not touch any of your existing
-environments, nor any existing Python installation. It will install all
-of the basic dependencies of *pandas*, as well as the development and
-testing tools. If you would like to install other dependencies, you can
-install them as follows:
-
-    conda install -n pandas_dev -c pandas pytables scipy
-
-To install *all* pandas dependencies you can do the following:
-
-    conda install -n pandas_dev -c pandas --file ci/requirements_all.txt
-
-To work in this environment, `activate` it as follows:
-
-    activate pandas_dev
-
-At which point, the prompt will change to indicate you are in the new
-development environment.
-
-> **note**
->
-> The above syntax is for `windows` environments. To work on
-> `macosx/linux`, use:
->
->     source activate pandas_dev
-
-To view your environments:
-
-    conda info -e
-
-To return to your home (root) environment:
-
-    deactivate
-
-See the full `conda` docs [here](http://conda.pydata.org/docs).
-
-At this point you can easily do an *in-place* install, as detailed in
-the next section.
-
-### Making changes
-
-Before making your code changes, it is often necessary to build the code
-that was just checked out. There are two primary methods of doing this.
-
-1. The best way to develop *pandas* is to build the C extensions
-   in-place by running:
-
-       python setup.py build_ext --inplace
-
-   If you start up the Python interpreter in the *pandas* source
-   directory, you will call the built C extensions.
-
-2. Another very common option is to do a `develop` install of *pandas*:
-
-       python setup.py develop
-
-   This makes a symbolic link that tells the Python interpreter to
-   import *pandas* from your development directory. Thus, you can
-   always be using the development version on your system without being
-   inside the clone directory.
-
-Contributing to the documentation
----------------------------------
-
-If you're not the developer type, contributing to the documentation is
-still of huge value. You don't even have to be an expert on *pandas* to
-do so! Something as simple as rewriting small passages for clarity as
-you reference the docs is a simple but effective way to contribute. The
-next person to read that passage will be in your debt!
-
-Actually, there are sections of the docs that are worse off by being
-written by experts. If something in the docs doesn't make sense to you,
-updating the relevant section after you figure it out is a simple way to
-ensure it will help the next person.
-
-### About the pandas documentation
-
-The documentation is written in **reStructuredText**, which is almost
-like writing in plain English, and built using
-[Sphinx](http://sphinx.pocoo.org/). The Sphinx Documentation has an
-excellent [introduction to reST](http://sphinx.pocoo.org/rest.html).
-Review the Sphinx docs to perform more complex changes to the
-documentation as well.
-
-Some other important things to know about the docs:
-
-- The *pandas* documentation consists of two parts: the docstrings in
-  the code itself and the docs in this folder `pandas/doc/`.
-
-  The docstrings provide a clear explanation of the usage of the
-  individual functions, while the documentation in this folder
-  consists of tutorial-like overviews per topic together with some
-  other information (what's new, installation, etc).
-
-- The docstrings follow the **Numpy Docstring Standard**, which is used
-  widely in the Scientific Python community. This standard specifies
-  the format of the different sections of the docstring. See [this
-  document](https://github.com/numpy/numpy/blob/master/doc/HOWTO_DOCUMENT.rst.txt)
-  for a detailed explanation, or look at some of the existing
-  functions to extend it in a similar manner.
-- The tutorials make heavy use of the [ipython
-  directive](http://matplotlib.org/sampledoc/ipython_directive.html)
-  sphinx extension. This directive lets you put code in the
-  documentation which will be run during the doc build. For example:
-
-      .. ipython:: python
-
-          x = 2
-          x**3
-
-  will be rendered as
-
-      In [1]: x = 2
-
-      In [2]: x**3
-      Out[2]: 8
-
-  This means that almost all code examples in the docs are always run
-  (and the output saved) during the doc build. This way, they will
-  always be up to date, but it makes the doc building a bit more
-  complex.
-
-### How to build the pandas documentation
-
-#### Requirements
-
-To build the *pandas* docs there are some extra requirements: you will
-need to have `sphinx` and `ipython` installed.
-[numpydoc](https://github.com/numpy/numpydoc) is used to parse the
-docstrings that follow the Numpy Docstring Standard (see above), but you
-don't need to install this because a local copy of `numpydoc` is
-included in the *pandas* source code.
-
-It is easiest to create a development environment (see above), then
-install:
-
-    conda install -n pandas_dev sphinx ipython
-
-Furthermore, it is recommended to have all [optional
-dependencies](http://pandas.pydata.org/pandas-docs/dev/install.html#optional-dependencies)
-installed.
This is not strictly necessary, but be aware that you will
-see some error messages. Because all the code in the documentation is
-executed during the doc build, the examples using these optional
-dependencies will generate errors. Run `pd.show_versions()` to get an
-overview of the installed version of all dependencies.
-
-> **warning**
->
-> Sphinx version >= 1.2.2 or the older 1.1.3 is required.
-
-#### Building the documentation
-
-So how do you build the docs? Navigate to your local `pandas/doc/`
-directory in the console and run:
-
-    python make.py html
-
-You can then find the HTML output in the folder
-`pandas/doc/build/html/`.
-
-The first time it will take quite a while, because it has to run all the
-code examples in the documentation and build all generated docstring
-pages. In subsequent invocations, sphinx will try to only build the pages
-that have been modified.
-
-If you want to do a full clean build, do:
-
-    python make.py clean
-    python make.py build
-
-Starting with 0.13.1 you can tell `make.py` to compile only a single
-section of the docs, greatly reducing the turn-around time for checking
-your changes. You will be prompted to delete .rst files that aren't
-required, since the last committed version can always be restored from
-git.
-
-    # omit autosummary and API section
-    python make.py clean
-    python make.py --no-api
-
-    # compile the docs with only a single
-    # section, that which is in indexing.rst
-    python make.py clean
-    python make.py --single indexing
-
-For comparison, a full documentation build may take 10 minutes, a
-`--no-api` build may take 3 minutes, and a single section may take 15
-seconds. However, subsequent builds only process portions you changed.
-Now, open the following file in a web browser to see the full
-documentation you just built:
-
-    pandas/doc/build/html/index.html
-
-And you'll have the satisfaction of seeing your new and improved
-documentation!
-
-Contributing to the code base
------------------------------
-
-### Code Standards
-
-*pandas* uses the [PEP8](http://www.python.org/dev/peps/pep-0008/)
-standard. There are several tools to ensure you abide by this standard.
-
-We've written a tool to check that your commits are PEP8 great, [pip
-install pep8radius](https://github.com/hayd/pep8radius). Look at PEP8
-fixes in your branch vs master with:
-
-    pep8radius master --diff
-
-and make these changes with:
-
-    pep8radius master --diff --in-place
-
-Alternatively, use the [flake8](http://pypi.python.org/pypi/flake8) tool
-for checking the style of your code. Additional standards are outlined on
-the [code style wiki
-page](https://github.com/pydata/pandas/wiki/Code-Style-and-Conventions).
-
-Please try to maintain backward-compatibility. *Pandas* has lots of
-users with lots of existing code, so don't break it if at all possible.
-If you think breakage is required, clearly state why as part of the Pull
-Request. Also, be careful when changing method signatures and add
-deprecation warnings where needed.
-
-### Test-driven Development/Writing Code
-
-*Pandas* is serious about [Test-driven Development
-(TDD)](http://en.wikipedia.org/wiki/Test-driven_development). This
-development process "relies on the repetition of a very short
-development cycle: first the developer writes an (initially failing)
-automated test case that defines a desired improvement or new function,
-then produces the minimum amount of code to pass that test." So, before
-actually writing any code, you should write your tests.
Often the test
-can be taken from the original GitHub issue. However, it is always worth
-considering additional use cases and writing corresponding tests.
-
-Adding tests is one of the most common requests after code is pushed to
-*pandas*. It is worth getting in the habit of writing tests ahead of
-time so this is never an issue.
-
-Like many packages, *pandas* uses the [Nose testing
-system](http://somethingaboutorange.com/mrl/projects/nose/) and the
-convenient extensions in
-[numpy.testing](http://docs.scipy.org/doc/numpy/reference/routines.testing.html).
-
-#### Writing tests
-
-All tests should go into the *tests* subdirectory of the specific
-package. There are probably many examples already there and looking at
-these for inspiration is suggested. If your test requires working with
-files or network connectivity, there is more information on the [testing
-page](https://github.com/pydata/pandas/wiki/Testing) of the wiki.
-
-The `pandas.util.testing` module has many special `assert` functions
-that make it easier to make statements about whether Series or DataFrame
-objects are equivalent. The easiest way to verify that your code is
-correct is to explicitly construct the result you expect, then compare
-the actual result to the expected correct result:
-
-    def test_pivot(self):
-        data = {
-            'index' : ['A', 'B', 'C', 'C', 'B', 'A'],
-            'columns' : ['One', 'One', 'One', 'Two', 'Two', 'Two'],
-            'values' : [1., 2., 3., 3., 2., 1.]
-        }
-
-        frame = DataFrame(data)
-        pivoted = frame.pivot(index='index', columns='columns', values='values')
-
-        expected = DataFrame({
-            'One' : {'A' : 1., 'B' : 2., 'C' : 3.},
-            'Two' : {'A' : 1., 'B' : 2., 'C' : 3.}
-        })
-
-        assert_frame_equal(pivoted, expected)
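In the same spirit as `test_pivot` above, a smaller hypothetical sketch using the Series helper from `pandas.util.testing` (the tested behaviour and names are invented for illustration):

```python
import pandas as pd
from pandas.util.testing import assert_series_equal

def test_cumsum_simple():
    # Construct the expected result explicitly, then compare.
    result = pd.Series([1, 2, 3]).cumsum()
    expected = pd.Series([1, 3, 6])
    assert_series_equal(result, expected)
```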
-
-#### Running the test suite
-
-The tests can then be run directly inside your git clone (without having
-to install *pandas*) by typing:
-
-    nosetests pandas
-
-The test suite is exhaustive and takes around 20 minutes to run. Often
-it is worth running only a subset of tests around your changes first,
-before running the entire suite. This is done using one of the following
-constructs:
-
-    nosetests pandas/tests/[test-module].py
-    nosetests pandas/tests/[test-module].py:[TestClass]
-    nosetests pandas/tests/[test-module].py:[TestClass].[test_method]
-
-#### Running the performance test suite
-
-Performance matters, and it is worth checking that your code has not
-introduced performance regressions. Currently *pandas* uses the [vbench
-library](https://github.com/pydata/vbench) to enable easy monitoring of
-the performance of critical *pandas* operations. These benchmarks are
-all found in the `pandas/vb_suite` directory. vbench currently only
-works on Python 2.
-
-To install vbench:
-
-    pip install git+https://github.com/pydata/vbench
-
-Vbench also requires sqlalchemy, gitpython, and psutil, which can all be
-installed using pip. If you need to run a benchmark, change your
-directory to the *pandas* root and run:
-
-    ./test_perf.sh -b master -t HEAD
-
-This will check out the master revision and run the suite on both master
-and your commit. Running the full benchmark suite can take up to one hour
-and use up to 3GB of RAM. Usually it is sufficient to paste a subset of
-the results into the Pull Request to show that the committed changes do
-not cause unexpected performance regressions.
-
-You can run specific benchmarks using the *-r* flag, which takes a
-regular expression.
-
-See the [performance testing
-wiki](https://github.com/pydata/pandas/wiki/Performance-Testing) for
-information on how to write a benchmark.
-
-### Documenting your code
-
-Changes should be reflected in the release notes located in
-doc/source/whatsnew/vx.y.z.txt. This file contains an ongoing change log
-for each release. Add an entry to this file to document your fix,
-enhancement or (unavoidable) breaking change. Make sure to include the
-GitHub issue number when adding your entry.
-
-If your code is an enhancement, it is most likely necessary to add usage
-examples to the existing documentation. This can be done following the
-section regarding documentation.
-
-Contributing your changes to *pandas*
--------------------------------------
-
-### Committing your code
-
-Keep style fixes to a separate commit to make your PR more readable.
-
-Once you've made changes, you can see them by typing:
-
-    git status
-
-If you've created a new file, it is not being tracked by git. Add it by
-typing:
-
-    git add path/to/file-to-be-added.py
-
-Doing 'git status' again should give something like:
-
-    # On branch shiny-new-feature
-    #
-    #   modified:   /relative/path/to/file-you-added.py
-    #
-
-Finally, commit your changes to your local repository with an
-explanatory message. An informal commit message format is in effect for
-the project. Please try to adhere to it. Here are some common prefixes
-along with general guidelines for when to use them:
-
-> - ENH: Enhancement, new functionality
-> - BUG: Bug fix
-> - DOC: Additions/updates to documentation
-> - TST: Additions/updates to tests
-> - BLD: Updates to the build process/scripts
-> - PERF: Performance improvement
-> - CLN: Code cleanup
-
-The following defines how a commit message should be structured. Please
-reference the relevant GitHub issues in your commit message using GH1234
-or #1234. Either style is fine, but the former is generally preferred:
-
-> - a subject line with < 80 chars.
-> - One blank line.
-> - Optionally, a commit message body.
-
-Now you can commit your changes in your local repository:
-
-    git commit -m
-
-If you have multiple commits, it is common to want to combine them into
-one commit, often referred to as "squashing" or "rebasing". This is a
-common request by package maintainers when submitting a Pull Request, as
-it maintains a more compact commit history. To rebase your commits:
-
-    git rebase -i HEAD~#
-
-Where # is the number of commits you want to combine. Then you can pick
-the relevant commit message and discard others.
-
-### Pushing your changes
-
-When you want your changes to appear publicly on your GitHub page, push
-your forked feature branch's commits:
-
-    git push origin shiny-new-feature
-
-Here origin is the default name given to your remote repository on
-GitHub. You can see the remote repositories:
-
-    git remote -v
-
-If you added the upstream repository as described above, you will see
-something like:
-
-    origin    git@github.com:yourname/pandas.git (fetch)
-    origin    git@github.com:yourname/pandas.git (push)
-    upstream  git://github.com/pydata/pandas.git (fetch)
-    upstream  git://github.com/pydata/pandas.git (push)
-
-Now your code is on GitHub, but it is not yet a part of the *pandas*
-project. For that to happen, a Pull Request needs to be submitted on
-GitHub.
-
-### Review your code
-
-When you're ready to ask for a code review, you will file a Pull
-Request.
Before you do, again make sure you've followed all the
-guidelines outlined in this document regarding code style, tests,
-performance tests, and documentation. You should also double check your
-branch changes against the branch it was based off of:
-
-1. Navigate to your repository on GitHub.
-2. Click on Branches.
-3. Click on the Compare button for your feature branch.
-4. Select the base and compare branches, if necessary. This will be
-   master and shiny-new-feature, respectively.
-
-### Finally, make the Pull Request
-
-If everything looks good, you are ready to make a Pull Request. A Pull
-Request is how code from a local repository becomes available to the
-GitHub community and can be looked at and eventually merged into the
-master version. This Pull Request and its associated changes will
-eventually be committed to the master branch and available in the next
-release. To submit a Pull Request:
-
-1. Navigate to your repository on GitHub.
-2. Click on the Pull Request button.
-3. You can then click on Commits and Files Changed to make sure
-   everything looks okay one last time.
-4. Write a description of your changes in the Preview Discussion tab.
-5. Click Send Pull Request.
-
-This request then appears to the repository maintainers, and they will
-review the code. If you need to make more changes, you can make them in
-your branch, push them to GitHub, and the pull request will be
-automatically updated. Pushing them to GitHub again is done by:
-
-    git push -f origin shiny-new-feature
-
-This will automatically update your Pull Request with the latest code
-and restart the Travis-CI tests.
-
-### Delete your merged branch (optional)
-
-Once your feature branch is accepted into upstream, you'll probably want
-to get rid of the branch. First, merge upstream master into your branch
-so git knows it is safe to delete your branch:
-
-    git fetch upstream
-    git checkout master
-    git merge upstream/master
-
-Then you can just do:
-
-    git branch -d shiny-new-feature
-
-Make sure you use a lower-case -d, or else git won't warn you if your
-feature branch has not actually been merged.
-
-The branch will still exist on GitHub, so to delete it there do:
-
-    git push origin --delete shiny-new-feature
diff --git a/LICENSE b/LICENSE
index c9b8834e8774b..924de26253bf4 100644
--- a/LICENSE
+++ b/LICENSE
@@ -1,87 +1,29 @@
-=======
-License
-=======
+BSD 3-Clause License
-pandas is distributed under a 3-clause ("Simplified" or "New") BSD
-license. Parts of NumPy, SciPy, numpydoc, bottleneck, which all have
-BSD-compatible licenses, are included. Their licenses follow the pandas
-license.
-
-pandas license
-==============
-
-Copyright (c) 2011-2012, Lambda Foundry, Inc. and PyData Development Team
-All rights reserved.
-
-Copyright (c) 2008-2011 AQR Capital Management, LLC
+Copyright (c) 2008-2012, AQR Capital Management, LLC, Lambda Foundry, Inc. and PyData Development Team
 All rights reserved.
 
 Redistribution and use in source and binary forms, with or without
-modification, are permitted provided that the following conditions are
-met:
-
-  * Redistributions of source code must retain the above copyright
-    notice, this list of conditions and the following disclaimer.
-
-  * Redistributions in binary form must reproduce the above
-    copyright notice, this list of conditions and the following
-    disclaimer in the documentation and/or other materials provided
-    with the distribution.
- - * Neither the name of the copyright holder nor the names of any - contributors may be used to endorse or promote products derived - from this software without specific prior written permission. - -THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER AND CONTRIBUTORS -"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT -LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR -A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT -OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, -SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT -LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, -DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY -THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT -(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +modification, are permitted provided that the following conditions are met: + +* Redistributions of source code must retain the above copyright notice, this + list of conditions and the following disclaimer. + +* Redistributions in binary form must reproduce the above copyright notice, + this list of conditions and the following disclaimer in the documentation + and/or other materials provided with the distribution. + +* Neither the name of the copyright holder nor the names of its + contributors may be used to endorse or promote products derived from + this software without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE +FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. - -About the Copyright Holders -=========================== - -AQR Capital Management began pandas development in 2008. Development was -led by Wes McKinney. AQR released the source under this license in 2009. -Wes is now an employee of Lambda Foundry, and remains the pandas project -lead. - -The PyData Development Team is the collection of developers of the PyData -project. This includes all of the PyData sub-projects, including pandas. The -core team that coordinates development on GitHub can be found here: -http://github.com/pydata. - -Full credits for pandas contributors can be found in the documentation. - -Our Copyright Policy -==================== - -PyData uses a shared copyright model. Each contributor maintains copyright -over their contributions to PyData. However, it is important to note that -these contributions are typically only changes to the repositories. Thus, -the PyData source code, in its entirety, is not the copyright of any single -person or institution. Instead, it is the collective copyright of the -entire PyData Development Team. 
If individual contributors want to maintain -a record of what changes/contributions they have specific copyright on, -they should indicate their copyright in the commit message of the change -when they commit the change to one of the PyData repositories. - -With this in mind, the following banner should be used in any source code -file to indicate the copyright and license terms: - -#----------------------------------------------------------------------------- -# Copyright (c) 2012, PyData Development Team -# All rights reserved. -# -# Distributed under the terms of the BSD Simplified License. -# -# The full license is in the LICENSE file, distributed with this software. -#----------------------------------------------------------------------------- - -Other licenses can be found in the LICENSES directory. \ No newline at end of file diff --git a/LICENSES/SAS7BDAT_LICENSE b/LICENSES/SAS7BDAT_LICENSE new file mode 100644 index 0000000000000..8fbf194013e93 --- /dev/null +++ b/LICENSES/SAS7BDAT_LICENSE @@ -0,0 +1,19 @@ +Copyright (c) 2015 Jared Hobbs + +Permission is hereby granted, free of charge, to any person obtaining a copy of +this software and associated documentation files (the "Software"), to deal in +the Software without restriction, including without limitation the rights to +use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies +of the Software, and to permit persons to whom the Software is furnished to do +so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. diff --git a/LICENSES/ULTRAJSON_LICENSE b/LICENSES/ULTRAJSON_LICENSE index defca46e7f820..3b2886eb9cfae 100644 --- a/LICENSES/ULTRAJSON_LICENSE +++ b/LICENSES/ULTRAJSON_LICENSE @@ -25,10 +25,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. Portions of code from MODP_ASCII - Ascii transformations (upper/lower, etc) -http://code.google.com/p/stringencoders/ +https://github.com/client9/stringencoders Copyright (c) 2007 Nick Galbreath -- nickg [at] modp [dot] com. All rights reserved. Numeric decoder derived from from TCL library http://www.opensource.apple.com/source/tcl/tcl-14/tcl/license.terms * Copyright (c) 1988-1993 The Regents of the University of California. - * Copyright (c) 1994 Sun Microsystems, Inc. \ No newline at end of file + * Copyright (c) 1994 Sun Microsystems, Inc. diff --git a/LICENSES/XARRAY_LICENSE b/LICENSES/XARRAY_LICENSE new file mode 100644 index 0000000000000..37ec93a14fdcd --- /dev/null +++ b/LICENSES/XARRAY_LICENSE @@ -0,0 +1,191 @@ +Apache License +Version 2.0, January 2004 +http://www.apache.org/licenses/ + +TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION + +1. Definitions. + +"License" shall mean the terms and conditions for use, reproduction, and +distribution as defined by Sections 1 through 9 of this document. + +"Licensor" shall mean the copyright owner or entity authorized by the copyright +owner that is granting the License. 
+ +"Legal Entity" shall mean the union of the acting entity and all other entities +that control, are controlled by, or are under common control with that entity. +For the purposes of this definition, "control" means (i) the power, direct or +indirect, to cause the direction or management of such entity, whether by +contract or otherwise, or (ii) ownership of fifty percent (50%) or more of the +outstanding shares, or (iii) beneficial ownership of such entity. + +"You" (or "Your") shall mean an individual or Legal Entity exercising +permissions granted by this License. + +"Source" form shall mean the preferred form for making modifications, including +but not limited to software source code, documentation source, and configuration +files. + +"Object" form shall mean any form resulting from mechanical transformation or +translation of a Source form, including but not limited to compiled object code, +generated documentation, and conversions to other media types. + +"Work" shall mean the work of authorship, whether in Source or Object form, made +available under the License, as indicated by a copyright notice that is included +in or attached to the work (an example is provided in the Appendix below). + +"Derivative Works" shall mean any work, whether in Source or Object form, that +is based on (or derived from) the Work and for which the editorial revisions, +annotations, elaborations, or other modifications represent, as a whole, an +original work of authorship. For the purposes of this License, Derivative Works +shall not include works that remain separable from, or merely link (or bind by +name) to the interfaces of, the Work and Derivative Works thereof. + +"Contribution" shall mean any work of authorship, including the original version +of the Work and any modifications or additions to that Work or Derivative Works +thereof, that is intentionally submitted to Licensor for inclusion in the Work +by the copyright owner or by an individual or Legal Entity authorized to submit +on behalf of the copyright owner. For the purposes of this definition, +"submitted" means any form of electronic, verbal, or written communication sent +to the Licensor or its representatives, including but not limited to +communication on electronic mailing lists, source code control systems, and +issue tracking systems that are managed by, or on behalf of, the Licensor for +the purpose of discussing and improving the Work, but excluding communication +that is conspicuously marked or otherwise designated in writing by the copyright +owner as "Not a Contribution." + +"Contributor" shall mean Licensor and any individual or Legal Entity on behalf +of whom a Contribution has been received by Licensor and subsequently +incorporated within the Work. + +2. Grant of Copyright License. + +Subject to the terms and conditions of this License, each Contributor hereby +grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, +irrevocable copyright license to reproduce, prepare Derivative Works of, +publicly display, publicly perform, sublicense, and distribute the Work and such +Derivative Works in Source or Object form. + +3. Grant of Patent License. 
+ +Subject to the terms and conditions of this License, each Contributor hereby +grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, +irrevocable (except as stated in this section) patent license to make, have +made, use, offer to sell, sell, import, and otherwise transfer the Work, where +such license applies only to those patent claims licensable by such Contributor +that are necessarily infringed by their Contribution(s) alone or by combination +of their Contribution(s) with the Work to which such Contribution(s) was +submitted. If You institute patent litigation against any entity (including a +cross-claim or counterclaim in a lawsuit) alleging that the Work or a +Contribution incorporated within the Work constitutes direct or contributory +patent infringement, then any patent licenses granted to You under this License +for that Work shall terminate as of the date such litigation is filed. + +4. Redistribution. + +You may reproduce and distribute copies of the Work or Derivative Works thereof +in any medium, with or without modifications, and in Source or Object form, +provided that You meet the following conditions: + +You must give any other recipients of the Work or Derivative Works a copy of +this License; and +You must cause any modified files to carry prominent notices stating that You +changed the files; and +You must retain, in the Source form of any Derivative Works that You distribute, +all copyright, patent, trademark, and attribution notices from the Source form +of the Work, excluding those notices that do not pertain to any part of the +Derivative Works; and +If the Work includes a "NOTICE" text file as part of its distribution, then any +Derivative Works that You distribute must include a readable copy of the +attribution notices contained within such NOTICE file, excluding those notices +that do not pertain to any part of the Derivative Works, in at least one of the +following places: within a NOTICE text file distributed as part of the +Derivative Works; within the Source form or documentation, if provided along +with the Derivative Works; or, within a display generated by the Derivative +Works, if and wherever such third-party notices normally appear. The contents of +the NOTICE file are for informational purposes only and do not modify the +License. You may add Your own attribution notices within Derivative Works that +You distribute, alongside or as an addendum to the NOTICE text from the Work, +provided that such additional attribution notices cannot be construed as +modifying the License. +You may add Your own copyright statement to Your modifications and may provide +additional or different license terms and conditions for use, reproduction, or +distribution of Your modifications, or for any such Derivative Works as a whole, +provided Your use, reproduction, and distribution of the Work otherwise complies +with the conditions stated in this License. + +5. Submission of Contributions. + +Unless You explicitly state otherwise, any Contribution intentionally submitted +for inclusion in the Work by You to the Licensor shall be under the terms and +conditions of this License, without any additional terms or conditions. +Notwithstanding the above, nothing herein shall supersede or modify the terms of +any separate license agreement you may have executed with Licensor regarding +such Contributions. + +6. Trademarks. 
+ +This License does not grant permission to use the trade names, trademarks, +service marks, or product names of the Licensor, except as required for +reasonable and customary use in describing the origin of the Work and +reproducing the content of the NOTICE file. + +7. Disclaimer of Warranty. + +Unless required by applicable law or agreed to in writing, Licensor provides the +Work (and each Contributor provides its Contributions) on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, +including, without limitation, any warranties or conditions of TITLE, +NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are +solely responsible for determining the appropriateness of using or +redistributing the Work and assume any risks associated with Your exercise of +permissions under this License. + +8. Limitation of Liability. + +In no event and under no legal theory, whether in tort (including negligence), +contract, or otherwise, unless required by applicable law (such as deliberate +and grossly negligent acts) or agreed to in writing, shall any Contributor be +liable to You for damages, including any direct, indirect, special, incidental, +or consequential damages of any character arising as a result of this License or +out of the use or inability to use the Work (including but not limited to +damages for loss of goodwill, work stoppage, computer failure or malfunction, or +any and all other commercial damages or losses), even if such Contributor has +been advised of the possibility of such damages. + +9. Accepting Warranty or Additional Liability. + +While redistributing the Work or Derivative Works thereof, You may choose to +offer, and charge a fee for, acceptance of support, warranty, indemnity, or +other liability obligations and/or rights consistent with this License. However, +in accepting such obligations, You may act only on Your own behalf and on Your +sole responsibility, not on behalf of any other Contributor, and only if You +agree to indemnify, defend, and hold each Contributor harmless for any liability +incurred by, or claims asserted against, such Contributor by reason of your +accepting any such warranty or additional liability. + +END OF TERMS AND CONDITIONS + +APPENDIX: How to apply the Apache License to your work + +To apply the Apache License to your work, attach the following boilerplate +notice, with the fields enclosed by brackets "[]" replaced with your own +identifying information. (Don't include the brackets!) The text should be +enclosed in the appropriate comment syntax for the file format. We also +recommend that a file or class name and description of purpose be included on +the same "printed page" as the copyright notice for easier identification within +third-party archives. + + Copyright [yyyy] [name of copyright owner] + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. 
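As a concrete sketch of the appendix's instructions (assuming a Python source file; the year and owner below are hypothetical placeholders, not values from this repository, and pandas itself does not use this header):

```python
# NOTE: "2018" and "Jane Doe" are hypothetical placeholders for the
# bracketed [yyyy] and [name of copyright owner] fields in the appendix.
#
# Copyright 2018 Jane Doe
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Example module: the license is applied entirely by the comment header."""
```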
diff --git a/MANIFEST.in b/MANIFEST.in index 2d26fbfd6adaf..b417b8890fa24 100644 --- a/MANIFEST.in +++ b/MANIFEST.in @@ -1,28 +1,41 @@ include MANIFEST.in include LICENSE include RELEASE.md -include README.rst +include README.md include setup.py graft doc prune doc/build -graft examples +graft LICENSES + graft pandas -global-exclude *.so -global-exclude *.pyd +global-exclude *.bz2 +global-exclude *.csv +global-exclude *.dta +global-exclude *.gz +global-exclude *.h5 +global-exclude *.html +global-exclude *.json +global-exclude *.msgpack +global-exclude *.pickle +global-exclude *.png global-exclude *.pyc +global-exclude *.pyd +global-exclude *.sas7bdat +global-exclude *.so +global-exclude *.xls +global-exclude *.xlsm +global-exclude *.xlsx +global-exclude *.xpt +global-exclude *.xz +global-exclude *.zip global-exclude *~ -global-exclude \#* -global-exclude .git* global-exclude .DS_Store -global-exclude *.png +global-exclude .git* +global-exclude \#* -# include examples/data/* -# recursive-include examples *.py -# recursive-include doc/source * -# recursive-include doc/sphinxext * -# recursive-include LICENSES * include versioneer.py include pandas/_version.py +include pandas/io/formats/templates/*.tpl diff --git a/Makefile b/Makefile index 9a768932b8bea..4a82566cf726e 100644 --- a/Makefile +++ b/Makefile @@ -1,4 +1,4 @@ -tseries: pandas/lib.pyx pandas/tslib.pyx pandas/hashtable.pyx +tseries: pandas/_libs/lib.pyx pandas/_libs/tslib.pyx pandas/_libs/hashtable.pyx python setup.py build_ext --inplace .PHONY : develop build clean clean_pyc tseries doc @@ -9,12 +9,12 @@ clean: clean_pyc: -find . -name '*.py[co]' -exec rm {} \; -sparse: pandas/src/sparse.pyx - python setup.py build_ext --inplace - build: clean_pyc python setup.py build_ext --inplace +lint-diff: + git diff master --name-only -- "*.py" | grep "pandas" | xargs flake8 + develop: build -python setup.py develop @@ -23,3 +23,4 @@ doc: cd doc; \ python make.py clean; \ python make.py html + python make.py spellcheck diff --git a/README.md b/README.md index 66e7605a63142..3c8fe57400099 100644 --- a/README.md +++ b/README.md @@ -1,48 +1,93 @@ +
+
+-----------------
+
+# pandas: powerful Python data analysis toolkit
+
[badge residue: the rewritten README header opens with a centered logo block and an HTML table of status badges whose markup did not survive extraction. The recoverable row labels are Latest Release (PyPI and conda), Package Status, License, Build Status (travis, circleci, and appveyor), Coverage, Downloads (conda-forge, replacing the removed conda and pypi download badges), and Gitter; the old Markdown badge lines are removed by this hunk.]
-[![https://gitter.im/pydata/pandas](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/pydata/pandas?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge) + ## What is it @@ -89,125 +134,49 @@ Here are just a few of the things that pandas does well: moving window linear regressions, date shifting and lagging, etc. - [missing-data]: http://pandas.pydata.org/pandas-docs/stable/missing_data.html#working-with-missing-data - [insertion-deletion]: http://pandas.pydata.org/pandas-docs/stable/dsintro.html#column-selection-addition-deletion - [alignment]: http://pandas.pydata.org/pandas-docs/stable/dsintro.html?highlight=alignment#intro-to-data-structures - [groupby]: http://pandas.pydata.org/pandas-docs/stable/groupby.html#group-by-split-apply-combine - [conversion]: http://pandas.pydata.org/pandas-docs/stable/dsintro.html#dataframe - [slicing]: http://pandas.pydata.org/pandas-docs/stable/indexing.html#slicing-ranges - [fancy-indexing]: http://pandas.pydata.org/pandas-docs/stable/indexing.html#advanced-indexing-with-ix - [subsetting]: http://pandas.pydata.org/pandas-docs/stable/indexing.html#boolean-indexing - [merging]: http://pandas.pydata.org/pandas-docs/stable/merging.html#database-style-dataframe-joining-merging - [joining]: http://pandas.pydata.org/pandas-docs/stable/merging.html#joining-on-index - [reshape]: http://pandas.pydata.org/pandas-docs/stable/reshaping.html#reshaping-and-pivot-tables - [pivot-table]: http://pandas.pydata.org/pandas-docs/stable/reshaping.html#pivot-tables-and-cross-tabulations - [mi]: http://pandas.pydata.org/pandas-docs/stable/indexing.html#hierarchical-indexing-multiindex - [flat-files]: http://pandas.pydata.org/pandas-docs/stable/io.html#csv-text-files - [excel]: http://pandas.pydata.org/pandas-docs/stable/io.html#excel-files - [db]: http://pandas.pydata.org/pandas-docs/stable/io.html#sql-queries - [hdfstore]: http://pandas.pydata.org/pandas-docs/stable/io.html#hdf5-pytables - [timeseries]: http://pandas.pydata.org/pandas-docs/stable/timeseries.html#time-series-date-functionality + [missing-data]: https://pandas.pydata.org/pandas-docs/stable/missing_data.html#working-with-missing-data + [insertion-deletion]: https://pandas.pydata.org/pandas-docs/stable/dsintro.html#column-selection-addition-deletion + [alignment]: https://pandas.pydata.org/pandas-docs/stable/dsintro.html?highlight=alignment#intro-to-data-structures + [groupby]: https://pandas.pydata.org/pandas-docs/stable/groupby.html#group-by-split-apply-combine + [conversion]: https://pandas.pydata.org/pandas-docs/stable/dsintro.html#dataframe + [slicing]: https://pandas.pydata.org/pandas-docs/stable/indexing.html#slicing-ranges + [fancy-indexing]: https://pandas.pydata.org/pandas-docs/stable/indexing.html#advanced-indexing-with-ix + [subsetting]: https://pandas.pydata.org/pandas-docs/stable/indexing.html#boolean-indexing + [merging]: https://pandas.pydata.org/pandas-docs/stable/merging.html#database-style-dataframe-joining-merging + [joining]: https://pandas.pydata.org/pandas-docs/stable/merging.html#joining-on-index + [reshape]: https://pandas.pydata.org/pandas-docs/stable/reshaping.html#reshaping-and-pivot-tables + [pivot-table]: https://pandas.pydata.org/pandas-docs/stable/reshaping.html#pivot-tables-and-cross-tabulations + [mi]: https://pandas.pydata.org/pandas-docs/stable/indexing.html#hierarchical-indexing-multiindex + [flat-files]: https://pandas.pydata.org/pandas-docs/stable/io.html#csv-text-files + [excel]: 
https://pandas.pydata.org/pandas-docs/stable/io.html#excel-files + [db]: https://pandas.pydata.org/pandas-docs/stable/io.html#sql-queries + [hdfstore]: https://pandas.pydata.org/pandas-docs/stable/io.html#hdf5-pytables + [timeseries]: https://pandas.pydata.org/pandas-docs/stable/timeseries.html#time-series-date-functionality ## Where to get it The source code is currently hosted on GitHub at: -http://github.com/pydata/pandas +https://github.com/pandas-dev/pandas -Binary installers for the latest released version are available at the Python -package index - - http://pypi.python.org/pypi/pandas/ - -And via `easy_install`: +Binary installers for the latest released version are available at the [Python +package index](https://pypi.org/project/pandas) and on conda. ```sh -easy_install pandas +# conda +conda install pandas ``` -or `pip`: - ```sh +# or PyPI pip install pandas ``` -or `conda`: - -```sh -conda install pandas -``` - ## Dependencies -- [NumPy](http://www.numpy.org): 1.7.0 or higher -- [python-dateutil](http://labix.org/python-dateutil): 1.5 or higher -- [pytz](http://pytz.sourceforge.net) - - Needed for time zone support with ``pandas.date_range`` - -### Highly Recommended Dependencies -- [numexpr](https://github.com/pydata/numexpr) - - Needed to accelerate some expression evaluation operations - - Required by PyTables -- [bottleneck](http://berkeleyanalytics.com/bottleneck) - - Needed to accelerate certain numerical operations - -### Optional dependencies -- [Cython](http://www.cython.org): Only necessary to build development version. Version 0.17.1 or higher. -- [SciPy](http://www.scipy.org): miscellaneous statistical functions -- [PyTables](http://www.pytables.org): necessary for HDF5-based storage -- [SQLAlchemy](http://www.sqlalchemy.org): for SQL database support. Version 0.8.1 or higher recommended. -- [matplotlib](http://matplotlib.sourceforge.net/): for plotting -- [statsmodels](http://statsmodels.sourceforge.net/) - - Needed for parts of `pandas.stats` -- For Excel I/O: - - [xlrd/xlwt](http://www.python-excel.org/) - - Excel reading (xlrd) and writing (xlwt) - - [openpyxl](http://packages.python.org/openpyxl/) - - openpyxl version 1.6.1 or higher, but lower than 2.0.0, for - writing .xlsx files - - xlrd >= 0.9.0 - - [XlsxWriter](https://pypi.python.org/pypi/XlsxWriter) - - Alternative Excel writer. -- [Google bq Command Line Tool](https://cloud.google.com/bigquery/bq-command-line-tool) - - Needed for `pandas.io.gbq` -- [boto](https://pypi.python.org/pypi/boto): necessary for Amazon S3 access. -- One of the following combinations of libraries is needed to use the - top-level [`pandas.read_html`][read-html-docs] function: - - [BeautifulSoup4][BeautifulSoup4] and [html5lib][html5lib] (Any - recent version of [html5lib][html5lib] is okay.) - - [BeautifulSoup4][BeautifulSoup4] and [lxml][lxml] - - [BeautifulSoup4][BeautifulSoup4] and [html5lib][html5lib] and [lxml][lxml] - - Only [lxml][lxml], although see [HTML reading gotchas][html-gotchas] - for reasons as to why you should probably **not** take this approach. - -#### Notes about HTML parsing libraries -- If you install [BeautifulSoup4][BeautifulSoup4] you must install - either [lxml][lxml] or [html5lib][html5lib] or both. - `pandas.read_html` will **not** work with *only* `BeautifulSoup4` - installed. -- You are strongly encouraged to read [HTML reading - gotchas][html-gotchas]. It explains issues surrounding the - installation and usage of the above three libraries. 
-- You may need to install an older version of - [BeautifulSoup4][BeautifulSoup4]: - - Versions 4.2.1, 4.1.3 and 4.0.2 have been confirmed for 64 and - 32-bit Ubuntu/Debian -- Additionally, if you're using [Anaconda][Anaconda] you should - definitely read [the gotchas about HTML parsing][html-gotchas] - libraries -- If you're on a system with `apt-get` you can do - - ```sh - sudo apt-get build-dep python-lxml - ``` - - to get the necessary dependencies for installation of [lxml][lxml]. - This will prevent further headaches down the line. - - [html5lib]: https://github.com/html5lib/html5lib-python "html5lib" - [BeautifulSoup4]: http://www.crummy.com/software/BeautifulSoup "BeautifulSoup4" - [lxml]: http://lxml.de - [Anaconda]: https://store.continuum.io/cshop/anaconda - [NumPy]: http://numpy.scipy.org/ - [html-gotchas]: http://pandas.pydata.org/pandas-docs/stable/gotchas.html#html-table-parsing - [read-html-docs]: http://pandas.pydata.org/pandas-docs/stable/generated/pandas.io.html.read_html.html#pandas.io.html.read_html +- [NumPy](https://www.numpy.org): 1.9.0 or higher +- [python-dateutil](https://labix.org/python-dateutil): 2.5.0 or higher +- [pytz](https://pythonhosted.org/pytz): 2011k or higher + +See the [full installation instructions](https://pandas.pydata.org/pandas-docs/stable/install.html#dependencies) +for recommended and optional dependencies. ## Installation from sources To install pandas from source you need Cython in addition to the normal @@ -238,32 +207,36 @@ mode](https://pip.pypa.io/en/latest/reference/pip_install.html#editable-installs pip install -e . ``` -On Windows, you will need to install MinGW and execute: - -```sh -python setup.py build --compiler=mingw32 -python setup.py install -``` - -See http://pandas.pydata.org/ for more information. +See the full instructions for [installing from source](https://pandas.pydata.org/pandas-docs/stable/install.html#installing-from-source). ## License -BSD +[BSD 3](LICENSE) ## Documentation -The official documentation is hosted on PyData.org: http://pandas.pydata.org/ - -The Sphinx documentation should provide a good starting point for learning how -to use the library. Expect the docs to continue to expand as time goes on. +The official documentation is hosted on PyData.org: https://pandas.pydata.org/pandas-docs/stable ## Background Work on ``pandas`` started at AQR (a quantitative hedge fund) in 2008 and has been under active development since then. +## Getting Help + +For usage questions, the best place to go to is [StackOverflow](https://stackoverflow.com/questions/tagged/pandas). +Further, general questions and discussions can also take place on the [pydata mailing list](https://groups.google.com/forum/?fromgroups#!forum/pydata). + ## Discussion and Development -Since pandas development is related to a number of other scientific -Python projects, questions are welcome on the scipy-user mailing -list. Specialized discussions or design issues should take place on -the PyData mailing list / Google group: +Most development discussion is taking place on github in this repo. Further, the [pandas-dev mailing list](https://mail.python.org/mailman/listinfo/pandas-dev) can also be used for specialized discussions or design issues, and a [Gitter channel](https://gitter.im/pydata/pandas) is available for quick development related questions. 
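A quick way to verify the dependency floors listed above after installing (a minimal sketch, not part of this diff, assuming a pandas release recent enough to ship `pandas.show_versions`):

```python
# Minimal post-install sanity check.
import pandas as pd

print(pd.__version__)  # the installed pandas release
pd.show_versions()     # reports NumPy, python-dateutil, pytz, and optional deps
```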
+
+## Contributing to pandas [![Open Source Helpers](https://www.codetriage.com/pandas-dev/pandas/badges/users.svg)](https://www.codetriage.com/pandas-dev/pandas)
+
+All contributions, bug reports, bug fixes, documentation improvements, enhancements and ideas are welcome.
+
+A detailed overview of how to contribute can be found in the **[contributing guide](https://pandas.pydata.org/pandas-docs/stable/contributing.html)**.
+
+If you are simply looking to start working with the pandas codebase, navigate to the [GitHub “issues” tab](https://github.com/pandas-dev/pandas/issues) and start looking through interesting issues. There are a number of issues listed under [Docs](https://github.com/pandas-dev/pandas/issues?labels=Docs&sort=updated&state=open) and [good first issue](https://github.com/pandas-dev/pandas/issues?labels=good+first+issue&sort=updated&state=open) where you could start out.
+
+You can also triage issues, which may include reproducing bug reports or asking for vital information such as version numbers or reproduction instructions. If you would like to start triaging issues, one easy way to get started is to [subscribe to pandas on CodeTriage](https://www.codetriage.com/pandas-dev/pandas).
+
+Or maybe, through using pandas, you have an idea of your own or are looking for something in the documentation and thinking ‘this can be improved’; you can do something about it!
-https://groups.google.com/forum/#!forum/pydata
+Feel free to ask questions on the [mailing list](https://groups.google.com/forum/?fromgroups#!forum/pydata) or on [Gitter](https://gitter.im/pydata/pandas).
diff --git a/RELEASE.md b/RELEASE.md
index 23c1817b7647c..efd075dabcba9 100644
--- a/RELEASE.md
+++ b/RELEASE.md
@@ -1,6 +1,6 @@
 Release Notes
 =============
-The list of changes to pandas between each release can be found
+The list of changes to Pandas between each release can be found
 [here](http://pandas.pydata.org/pandas-docs/stable/whatsnew.html). For full
-details, see the commit logs at http://github.com/pydata/pandas.
+details, see the commit logs at http://github.com/pandas-dev/pandas.
diff --git a/appveyor.yml b/appveyor.yml
index 9cec7895f1493..f70fc829ec971 100644
--- a/appveyor.yml
+++ b/appveyor.yml
@@ -1,38 +1,89 @@
+# With info from
+# http://tjelvarolsson.com/blog/how-to-continuously-test-your-python-code-on-windows-using-appveyor/
+# https://packaging.python.org/en/latest/appveyor/
+# https://github.com/rmcgibbo/python-appveyor-conda-example
+
+# Backslashes in quotes need to be escaped: \ -> "\\"
+
+matrix:
+  fast_finish: true    # immediately finish build once one of the jobs fails.
+ environment: global: # SDK v7.0 MSVC Express 2008's SetEnv.cmd script will fail if the - # /E:ON and /V:ON options are not enabled in the batch script intepreter + # /E:ON and /V:ON options are not enabled in the batch script interpreter # See: http://stackoverflow.com/a/13751649/163740 CMD_IN_ENV: "cmd /E:ON /V:ON /C .\\ci\\run_with_env.cmd" + clone_folder: C:\projects\pandas + PANDAS_TESTING_MODE: "deprecate" matrix: - - PYTHON: "C:\\Python27_32" - PYTHON_VERSION: "2.7" - PYTHON_ARCH: "32" - - PYTHON: "C:\\Python27_64" + - CONDA_ROOT: "C:\\Miniconda3_64" + PYTHON_VERSION: "3.6" + PYTHON_ARCH: "64" + CONDA_PY: "36" + CONDA_NPY: "113" + + - CONDA_ROOT: "C:\\Miniconda3_64" PYTHON_VERSION: "2.7" PYTHON_ARCH: "64" + CONDA_PY: "27" + CONDA_NPY: "110" - - PYTHON: "C:\\Python34_32" - PYTHON_VERSION: "3.4" - PYTHON_ARCH: "32" +# We always use a 64-bit machine, but can build x86 distributions +# with the PYTHON_ARCH variable (which is used by CMD_IN_ENV). +platform: + - x64 - - PYTHON: "C:\\Python34_64" - PYTHON_VERSION: "3.4" - PYTHON_ARCH: "64" +# all our python builds have to happen in tests_script... +build: false install: - # this installs the appropriate Miniconda (Py2/Py3, 32/64 bit), - # as well as pip, conda-build, and the binstar CLI + # cancel older builds for the same PR + - ps: if ($env:APPVEYOR_PULL_REQUEST_NUMBER -and $env:APPVEYOR_BUILD_NUMBER -ne ((Invoke-RestMethod ` + https://ci.appveyor.com/api/projects/$env:APPVEYOR_ACCOUNT_NAME/$env:APPVEYOR_PROJECT_SLUG/history?recordsNumber=50).builds | ` + Where-Object pullRequestId -eq $env:APPVEYOR_PULL_REQUEST_NUMBER)[0].buildNumber) { ` + throw "There are newer queued builds for this pull request, failing early." } + + # this installs the appropriate Miniconda (Py2/Py3, 32/64 bit) + # updates conda & installs: conda-build jinja2 anaconda-client + - powershell .\ci\install.ps1 + - SET PATH=%CONDA_ROOT%;%CONDA_ROOT%\Scripts;%PATH% - echo "install" - cd - ls -ltr - - powershell .\\ci\\install_appveyor.ps1 - - "SET PATH=%PYTHON%;%PYTHON%\\Scripts;%PATH%" + - git tag --sort v:refname -build: false + # this can conflict with git + - cmd: rmdir C:\cygwin /s /q + + # install our build environment + - cmd: conda config --set show_channel_urls true --set always_yes true --set changeps1 false + - cmd: conda update -q conda + - cmd: conda config --set ssl_verify false + + # add the pandas channel *before* defaults to have defaults take priority + - cmd: conda config --add channels conda-forge + - cmd: conda config --add channels pandas + - cmd: conda config --remove channels defaults + - cmd: conda config --add channels defaults + + # this is now the downloaded conda... 
+ - cmd: conda info -a + + # create our env + - cmd: conda env create -q -n pandas --file=ci\appveyor-%CONDA_PY%.yaml + - cmd: activate pandas + - cmd: conda list -n pandas + # uninstall pandas if it's present + - cmd: conda remove pandas -y --force & exit 0 + - cmd: pip uninstall -y pandas & exit 0 + + # build em using the local source checkout in the correct windows env + - cmd: '%CMD_IN_ENV% python setup.py build_ext --inplace' test_script: - - "%CMD_IN_ENV% %PYTHON%/python.exe setup.py build_ext --inplace" - - "%PYTHON%/Scripts/nosetests -A \"not slow and not network and not disabled\" pandas" + # tests + - cmd: activate pandas + - cmd: test.bat diff --git a/asv_bench/asv.conf.json b/asv_bench/asv.conf.json index dcea59545aae3..9c333f62810f4 100644 --- a/asv_bench/asv.conf.json +++ b/asv_bench/asv.conf.json @@ -21,32 +21,70 @@ "environment_type": "conda", // the base URL to show a commit for the project. - "show_commit_url": "https://github.com/pydata/pandas/commit/", + "show_commit_url": "https://github.com/pandas-dev/pandas/commit/", // The Pythons you'd like to test against. If not provided, defaults // to the current version of Python used to run `asv`. // "pythons": ["2.7", "3.4"], - "pythons": ["2.7"], + "pythons": ["3.6"], // The matrix of dependencies to test. Each key is the name of a // package (in PyPI) and the values are version numbers. An empty - // list indicates to just test against the default (latest) - // version. + // list or empty string indicates to just test against the default + // (latest) version. null indicates that the package is to not be + // installed. If the package to be tested is only available from + // PyPi, and the 'environment_type' is conda, then you can preface + // the package name by 'pip+', and the package will be installed via + // pip (with all the conda available packages installed first, + // followed by the pip installed packages). "matrix": { - // To run against multiple versions, replace with - // "numpy": ["1.7", "1.9"], "numpy": [], "Cython": [], "matplotlib": [], "sqlalchemy": [], "scipy": [], "numexpr": [], - "pytables": [], + "pytables": [null, ""], // platform dependent, see excludes below + "tables": [null, ""], "openpyxl": [], + "xlsxwriter": [], "xlrd": [], - "xlwt": [] + "xlwt": [], + "pytest": [], + // If using Windows with python 2.7 and want to build using the + // mingw toolchain (rather than MSVC), uncomment the following line. + // "libpython": [], }, + // Combinations of libraries/python versions can be excluded/included + // from the set to test. Each entry is a dictionary containing additional + // key-value pairs to include/exclude. + // + // An exclude entry excludes entries where all values match. The + // values are regexps that should match the whole string. + // + // An include entry adds an environment. Only the packages listed + // are installed. The 'python' key is required. The exclude rules + // do not apply to includes. + // + // In addition to package names, the following keys are available: + // + // - python + // Python version, as in the *pythons* variable above. + // - environment_type + // Environment type, as above. + // - sys_platform + // Platform, as in sys.platform. Possible values for the common + // cases: 'linux2', 'win32', 'cygwin', 'darwin'. 
+ "exclude": [ + // On conda install pytables, otherwise tables + {"environment_type": "conda", "tables": ""}, + {"environment_type": "conda", "pytables": null}, + {"environment_type": "(?!conda).*", "tables": null}, + {"environment_type": "(?!conda).*", "pytables": ""}, + ], + "include": [], + // The directory (relative to the current directory) that benchmarks are // stored in. If not provided, defaults to "benchmarks" // "benchmark_dir": "benchmarks", @@ -55,7 +93,6 @@ // environments in. If not provided, defaults to "env" // "env_dir": "env", - // The directory (relative to the current directory) that raw benchmark // results are stored in. If not provided, defaults to "results". // "results_dir": "results", @@ -65,5 +102,25 @@ // "html_dir": "html", // The number of characters to retain in the commit hashes. - // "hash_length": 8 + // "hash_length": 8, + + // `asv` will cache wheels of the recent builds in each + // environment, making them faster to install next time. This is + // number of builds to keep, per environment. + "wheel_cache_size": 8, + + // The commits after which the regression search in `asv publish` + // should start looking for regressions. Dictionary whose keys are + // regexps matching to benchmark names, and values corresponding to + // the commit (exclusive) after which to start looking for + // regressions. The default is to start from the first commit + // with results. If the commit is `null`, regression detection is + // skipped for the matching benchmark. + // + "regressions_first_commits": { + ".*": "v0.20.0" + }, + "regression_thresholds": { + ".*": 0.05 + } } diff --git a/asv_bench/benchmarks/algorithms.py b/asv_bench/benchmarks/algorithms.py new file mode 100644 index 0000000000000..cccd38ef11251 --- /dev/null +++ b/asv_bench/benchmarks/algorithms.py @@ -0,0 +1,128 @@ +import warnings +from importlib import import_module + +import numpy as np +import pandas as pd +from pandas.util import testing as tm + +for imp in ['pandas.util', 'pandas.tools.hashing']: + try: + hashing = import_module(imp) + break + except: + pass + +from .pandas_vb_common import setup # noqa + + +class Factorize(object): + + goal_time = 0.2 + + params = [True, False] + param_names = ['sort'] + + def setup(self, sort): + N = 10**5 + self.int_idx = pd.Int64Index(np.arange(N).repeat(5)) + self.float_idx = pd.Float64Index(np.random.randn(N).repeat(5)) + self.string_idx = tm.makeStringIndex(N) + + def time_factorize_int(self, sort): + self.int_idx.factorize(sort=sort) + + def time_factorize_float(self, sort): + self.float_idx.factorize(sort=sort) + + def time_factorize_string(self, sort): + self.string_idx.factorize(sort=sort) + + +class Duplicated(object): + + goal_time = 0.2 + + params = ['first', 'last', False] + param_names = ['keep'] + + def setup(self, keep): + N = 10**5 + self.int_idx = pd.Int64Index(np.arange(N).repeat(5)) + self.float_idx = pd.Float64Index(np.random.randn(N).repeat(5)) + self.string_idx = tm.makeStringIndex(N) + + def time_duplicated_int(self, keep): + self.int_idx.duplicated(keep=keep) + + def time_duplicated_float(self, keep): + self.float_idx.duplicated(keep=keep) + + def time_duplicated_string(self, keep): + self.string_idx.duplicated(keep=keep) + + +class DuplicatedUniqueIndex(object): + + goal_time = 0.2 + + def setup(self): + N = 10**5 + self.idx_int_dup = pd.Int64Index(np.arange(N * 5)) + # cache is_unique + self.idx_int_dup.is_unique + + def time_duplicated_unique_int(self): + self.idx_int_dup.duplicated() + + +class Match(object): + + goal_time = 0.2 + 
+ def setup(self): + self.uniques = tm.makeStringIndex(1000).values + self.all = self.uniques.repeat(10) + + def time_match_string(self): + with warnings.catch_warnings(record=True): + pd.match(self.all, self.uniques) + + +class Hashing(object): + + goal_time = 0.2 + + def setup_cache(self): + N = 10**5 + + df = pd.DataFrame( + {'strings': pd.Series(tm.makeStringIndex(10000).take( + np.random.randint(0, 10000, size=N))), + 'floats': np.random.randn(N), + 'ints': np.arange(N), + 'dates': pd.date_range('20110101', freq='s', periods=N), + 'timedeltas': pd.timedelta_range('1 day', freq='s', periods=N)}) + df['categories'] = df['strings'].astype('category') + df.iloc[10:20] = np.nan + return df + + def time_frame(self, df): + hashing.hash_pandas_object(df) + + def time_series_int(self, df): + hashing.hash_pandas_object(df['ints']) + + def time_series_string(self, df): + hashing.hash_pandas_object(df['strings']) + + def time_series_float(self, df): + hashing.hash_pandas_object(df['floats']) + + def time_series_categorical(self, df): + hashing.hash_pandas_object(df['categories']) + + def time_series_timedeltas(self, df): + hashing.hash_pandas_object(df['timedeltas']) + + def time_series_dates(self, df): + hashing.hash_pandas_object(df['dates']) diff --git a/asv_bench/benchmarks/attrs_caching.py b/asv_bench/benchmarks/attrs_caching.py index 2b10cb88a3134..48f0b7d71144c 100644 --- a/asv_bench/benchmarks/attrs_caching.py +++ b/asv_bench/benchmarks/attrs_caching.py @@ -1,23 +1,40 @@ -from .pandas_vb_common import * +import numpy as np +from pandas import DataFrame +try: + from pandas.util import cache_readonly +except ImportError: + from pandas.util.decorators import cache_readonly +from .pandas_vb_common import setup # noqa + + +class DataFrameAttributes(object): -class getattr_dataframe_index(object): goal_time = 0.2 def setup(self): self.df = DataFrame(np.random.randn(10, 6)) self.cur_index = self.df.index - def time_getattr_dataframe_index(self): + def time_get_index(self): self.foo = self.df.index + def time_set_index(self): + self.df.index = self.cur_index + + +class CacheReadonly(object): -class setattr_dataframe_index(object): goal_time = 0.2 def setup(self): - self.df = DataFrame(np.random.randn(10, 6)) - self.cur_index = self.df.index - def time_setattr_dataframe_index(self): - self.df.index = self.cur_index \ No newline at end of file + class Foo: + + @cache_readonly + def prop(self): + return 5 + self.obj = Foo() + + def time_cache_readonly(self): + self.obj.prop diff --git a/asv_bench/benchmarks/binary_ops.py b/asv_bench/benchmarks/binary_ops.py index d22d01f261b27..cc8766e1fa39c 100644 --- a/asv_bench/benchmarks/binary_ops.py +++ b/asv_bench/benchmarks/binary_ops.py @@ -1,261 +1,151 @@ -from .pandas_vb_common import * -import pandas.computation.expressions as expr +import numpy as np +from pandas import DataFrame, Series, date_range +from pandas.core.algorithms import checked_add_with_arr +try: + import pandas.core.computation.expressions as expr +except ImportError: + import pandas.computation.expressions as expr +from .pandas_vb_common import setup # noqa -class frame_add(object): - goal_time = 0.2 - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) +class Ops(object): - def time_frame_add(self): - (self.df + self.df2) - - -class frame_add_no_ne(object): goal_time = 0.2 - def setup(self): + params = [[True, False], ['default', 1]] + param_names = ['use_numexpr', 'threads'] + + def setup(self, use_numexpr, threads): 
self.df = DataFrame(np.random.randn(20000, 100)) self.df2 = DataFrame(np.random.randn(20000, 100)) - expr.set_use_numexpr(False) - - def time_frame_add_no_ne(self): - (self.df + self.df2) - def teardown(self): - expr.set_use_numexpr(True) + if threads != 'default': + expr.set_numexpr_threads(threads) + if not use_numexpr: + expr.set_use_numexpr(False) + def time_frame_add(self, use_numexpr, threads): + self.df + self.df2 -class frame_add_st(object): - goal_time = 0.2 + def time_frame_mult(self, use_numexpr, threads): + self.df * self.df2 - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - expr.set_numexpr_threads(1) + def time_frame_multi_and(self, use_numexpr, threads): + self.df[(self.df > 0) & (self.df2 > 0)] - def time_frame_add_st(self): - (self.df + self.df2) + def time_frame_comparison(self, use_numexpr, threads): + self.df > self.df2 - def teardown(self): + def teardown(self, use_numexpr, threads): + expr.set_use_numexpr(True) expr.set_numexpr_threads() -class frame_float_div(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 1000)) - self.df2 = DataFrame(np.random.randn(1000, 1000)) - - def time_frame_float_div(self): - (self.df // self.df2) +class Ops2(object): - -class frame_float_div_by_zero(object): goal_time = 0.2 def setup(self): - self.df = DataFrame(np.random.randn(1000, 1000)) + N = 10**3 + self.df = DataFrame(np.random.randn(N, N)) + self.df2 = DataFrame(np.random.randn(N, N)) - def time_frame_float_div_by_zero(self): - (self.df / 0) + self.df_int = DataFrame(np.random.randint(np.iinfo(np.int16).min, + np.iinfo(np.int16).max, + size=(N, N))) + self.df2_int = DataFrame(np.random.randint(np.iinfo(np.int16).min, + np.iinfo(np.int16).max, + size=(N, N))) + # Division -class frame_float_floor_by_zero(object): - goal_time = 0.2 + def time_frame_float_div(self): + self.df // self.df2 - def setup(self): - self.df = DataFrame(np.random.randn(1000, 1000)) + def time_frame_float_div_by_zero(self): + self.df / 0 def time_frame_float_floor_by_zero(self): - (self.df // 0) - - -class frame_float_mod(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 1000)) - self.df2 = DataFrame(np.random.randn(1000, 1000)) - - def time_frame_float_mod(self): - (self.df / self.df2) - - -class frame_int_div_by_zero(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.random_integers(np.iinfo(np.int16).min, np.iinfo(np.int16).max, size=(1000, 1000))) + self.df // 0 def time_frame_int_div_by_zero(self): - (self.df / 0) + self.df_int / 0 - -class frame_int_mod(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.random_integers(np.iinfo(np.int16).min, np.iinfo(np.int16).max, size=(1000, 1000))) - self.df2 = DataFrame(np.random.random_integers(np.iinfo(np.int16).min, np.iinfo(np.int16).max, size=(1000, 1000))) + # Modulo def time_frame_int_mod(self): - (self.df / self.df2) - - -class frame_mult(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - - def time_frame_mult(self): - (self.df * self.df2) - + self.df_int % self.df2_int -class frame_mult_no_ne(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - expr.set_use_numexpr(False) - - def time_frame_mult_no_ne(self): - (self.df * self.df2) - - def 
teardown(self): - expr.set_use_numexpr(True) - - -class frame_mult_st(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - expr.set_numexpr_threads(1) - - def time_frame_mult_st(self): - (self.df * self.df2) - - def teardown(self): - expr.set_numexpr_threads() - - -class frame_multi_and(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - - def time_frame_multi_and(self): - self.df[((self.df > 0) & (self.df2 > 0))] - - -class frame_multi_and_no_ne(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - expr.set_use_numexpr(False) - - def time_frame_multi_and_no_ne(self): - self.df[((self.df > 0) & (self.df2 > 0))] - - def teardown(self): - expr.set_use_numexpr(True) - - -class frame_multi_and_st(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - expr.set_numexpr_threads(1) - - def time_frame_multi_and_st(self): - self.df[((self.df > 0) & (self.df2 > 0))] + def time_frame_float_mod(self): + self.df % self.df2 - def teardown(self): - expr.set_numexpr_threads() +class Timeseries(object): -class series_timestamp_compare(object): goal_time = 0.2 - def setup(self): - self.N = 1000000 - self.halfway = ((self.N // 2) - 1) - self.s = Series(date_range('20010101', periods=self.N, freq='T')) - self.ts = self.s[self.halfway] + params = [None, 'US/Eastern'] + param_names = ['tz'] - def time_series_timestamp_compare(self): - (self.s <= self.ts) + def setup(self, tz): + N = 10**6 + halfway = (N // 2) - 1 + self.s = Series(date_range('20010101', periods=N, freq='T', tz=tz)) + self.ts = self.s[halfway] + self.s2 = Series(date_range('20010101', periods=N, freq='s', tz=tz)) -class timestamp_ops_diff1(object): - goal_time = 0.2 - N = 1000000 + def time_series_timestamp_compare(self, tz): + self.s <= self.ts - def setup(self): - self.s = self.create() + def time_timestamp_series_compare(self, tz): + self.ts >= self.s - def create(self): - return Series(date_range('20010101', periods=self.N, freq='s')) + def time_timestamp_ops_diff(self, tz): + self.s2.diff() - def time_timestamp_ops_diff1(self): - self.s.diff() + def time_timestamp_ops_diff_with_shift(self, tz): + self.s - self.s.shift() -class timestamp_tz_ops_diff1(timestamp_ops_diff1): - N = 10000 - def create(self): - return Series(date_range('20010101', periods=self.N, freq='s', tz='US/Eastern')) +class AddOverflowScalar(object): -class timestamp_ops_diff2(object): goal_time = 0.2 - N = 1000000 - def setup(self): - self.s = self.create() + params = [1, -1, 0] + param_names = ['scalar'] - def create(self): - return Series(date_range('20010101', periods=self.N, freq='s')) + def setup(self, scalar): + N = 10**6 + self.arr = np.arange(N) - def time_timestamp_ops_diff2(self): - (self.s - self.s.shift()) + def time_add_overflow_scalar(self, scalar): + checked_add_with_arr(self.arr, scalar) -class timestamp_tz_ops_diff2(timestamp_ops_diff2): - N = 10000 - def create(self): - return Series(date_range('20010101', periods=self.N, freq='s', tz='US/Eastern')) +class AddOverflowArray(object): -class timestamp_series_compare(object): goal_time = 0.2 - N = 1000000 def setup(self): - self.halfway = ((self.N // 2) - 1) - self.s = self.create() - self.ts = self.s[self.halfway] + N 
= 10**6 + self.arr = np.arange(N) + self.arr_rev = np.arange(-N, 0) + self.arr_mixed = np.array([1, -1]).repeat(N / 2) + self.arr_nan_1 = np.random.choice([True, False], size=N) + self.arr_nan_2 = np.random.choice([True, False], size=N) - def create(self): - return Series(date_range('20010101', periods=self.N, freq='T')) + def time_add_overflow_arr_rev(self): + checked_add_with_arr(self.arr, self.arr_rev) - def time_timestamp_series_compare(self): - (self.ts >= self.s) + def time_add_overflow_arr_mask_nan(self): + checked_add_with_arr(self.arr, self.arr_mixed, arr_mask=self.arr_nan_1) -class timestamp_tz_series_compare(timestamp_series_compare): - N = 10000 + def time_add_overflow_b_mask_nan(self): + checked_add_with_arr(self.arr, self.arr_mixed, + b_mask=self.arr_nan_1) - def create(self): - return Series(date_range('20010101', periods=self.N, freq='T', tz='US/Eastern')) + def time_add_overflow_both_arg_nan(self): + checked_add_with_arr(self.arr, self.arr_mixed, arr_mask=self.arr_nan_1, + b_mask=self.arr_nan_2) diff --git a/asv_bench/benchmarks/categoricals.py b/asv_bench/benchmarks/categoricals.py index a0f9383336940..2a7717378c280 100644 --- a/asv_bench/benchmarks/categoricals.py +++ b/asv_bench/benchmarks/categoricals.py @@ -1,45 +1,247 @@ -from .pandas_vb_common import * -import string +import warnings + +import numpy as np +import pandas as pd +import pandas.util.testing as tm +try: + from pandas.api.types import union_categoricals +except ImportError: + try: + from pandas.types.concat import union_categoricals + except ImportError: + pass + +from .pandas_vb_common import setup # noqa + + +class Concat(object): -class concat_categorical(object): goal_time = 0.2 def setup(self): - self.s = pd.Series((list('aabbcd') * 1000000)).astype('category') + N = 10**5 + self.s = pd.Series(list('aabbcd') * N).astype('category') + + self.a = pd.Categorical(list('aabbcd') * N) + self.b = pd.Categorical(list('bbcdjk') * N) + + def time_concat(self): + pd.concat([self.s, self.s]) - def time_concat_categorical(self): - concat([self.s, self.s]) + def time_union(self): + union_categoricals([self.a, self.b]) -class categorical_value_counts(object): - goal_time = 1 +class Constructor(object): + + goal_time = 0.2 def setup(self): - n = 500000 - np.random.seed(2718281) + N = 10**5 + self.categories = list('abcde') + self.cat_idx = pd.Index(self.categories) + self.values = np.tile(self.categories, N) + self.codes = np.tile(range(len(self.categories)), N) + + self.datetimes = pd.Series(pd.date_range('1995-01-01 00:00:00', + periods=N / 10, + freq='s')) + self.datetimes_with_nat = self.datetimes.copy() + self.datetimes_with_nat.iloc[-1] = pd.NaT + + self.values_some_nan = list(np.tile(self.categories + [np.nan], N)) + self.values_all_nan = [np.nan] * len(self.values) + self.values_all_int8 = np.ones(N, 'int8') + + def time_regular(self): + pd.Categorical(self.values, self.categories) + + def time_fastpath(self): + pd.Categorical(self.codes, self.cat_idx, fastpath=True) + + def time_datetimes(self): + pd.Categorical(self.datetimes) + + def time_datetimes_with_nat(self): + pd.Categorical(self.datetimes_with_nat) + + def time_with_nan(self): + pd.Categorical(self.values_some_nan) + + def time_all_nan(self): + pd.Categorical(self.values_all_nan) + + def time_from_codes_all_int8(self): + pd.Categorical.from_codes(self.values_all_int8, self.categories) + + +class ValueCounts(object): + + goal_time = 0.2 + + params = [True, False] + param_names = ['dropna'] + + def setup(self, dropna): + n = 5 * 10**5 arr = ['s%04d' 
% i for i in np.random.randint(0, n // 10, size=n)] - self.ts = Series(arr).astype('category') + self.ts = pd.Series(arr).astype('category') + + def time_value_counts(self, dropna): + self.ts.value_counts(dropna=dropna) - def time_value_counts(self): - self.ts.value_counts(dropna=False) - def time_value_counts_dropna(self): - self.ts.value_counts(dropna=True) +class Repr(object): -class categorical_constructor(object): goal_time = 0.2 def setup(self): - n = 5 - N = 1e6 - self.categories = list(string.ascii_letters[:n]) - self.cat_idx = Index(self.categories) - self.values = np.tile(self.categories, N) - self.codes = np.tile(range(n), N) + self.sel = pd.Series(['s1234']).astype('category') - def time_regular_constructor(self): - Categorical(self.values, self.categories) + def time_rendering(self): + str(self.sel) - def time_fastpath(self): - Categorical(self.codes, self.cat_idx, fastpath=True) +class SetCategories(object): + + goal_time = 0.2 + + def setup(self): + n = 5 * 10**5 + arr = ['s%04d' % i for i in np.random.randint(0, n // 10, size=n)] + self.ts = pd.Series(arr).astype('category') + + def time_set_categories(self): + self.ts.cat.set_categories(self.ts.cat.categories[::2]) + + +class Rank(object): + + goal_time = 0.2 + + def setup(self): + N = 10**5 + ncats = 100 + + self.s_str = pd.Series(tm.makeCategoricalIndex(N, ncats)).astype(str) + self.s_str_cat = self.s_str.astype('category') + with warnings.catch_warnings(record=True): + self.s_str_cat_ordered = self.s_str.astype('category', + ordered=True) + + self.s_int = pd.Series(np.random.randint(0, ncats, size=N)) + self.s_int_cat = self.s_int.astype('category') + with warnings.catch_warnings(record=True): + self.s_int_cat_ordered = self.s_int.astype('category', + ordered=True) + + def time_rank_string(self): + self.s_str.rank() + + def time_rank_string_cat(self): + self.s_str_cat.rank() + + def time_rank_string_cat_ordered(self): + self.s_str_cat_ordered.rank() + + def time_rank_int(self): + self.s_int.rank() + + def time_rank_int_cat(self): + self.s_int_cat.rank() + + def time_rank_int_cat_ordered(self): + self.s_int_cat_ordered.rank() + + +class Isin(object): + + goal_time = 0.2 + + params = ['object', 'int64'] + param_names = ['dtype'] + + def setup(self, dtype): + np.random.seed(1234) + n = 5 * 10**5 + sample_size = 100 + arr = [i for i in np.random.randint(0, n // 10, size=n)] + if dtype == 'object': + arr = ['s%04d' % i for i in arr] + self.sample = np.random.choice(arr, sample_size) + self.series = pd.Series(arr).astype('category') + + def time_isin_categorical(self, dtype): + self.series.isin(self.sample) + + +class IsMonotonic(object): + + def setup(self): + N = 1000 + self.c = pd.CategoricalIndex(list('a' * N + 'b' * N + 'c' * N)) + self.s = pd.Series(self.c) + + def time_categorical_index_is_monotonic_increasing(self): + self.c.is_monotonic_increasing + + def time_categorical_index_is_monotonic_decreasing(self): + self.c.is_monotonic_decreasing + + def time_categorical_series_is_monotonic_increasing(self): + self.s.is_monotonic_increasing + + def time_categorical_series_is_monotonic_decreasing(self): + self.s.is_monotonic_decreasing + + +class Contains(object): + + goal_time = 0.2 + + def setup(self): + N = 10**5 + self.ci = tm.makeCategoricalIndex(N) + self.c = self.ci.values + self.key = self.ci.categories[0] + + def time_categorical_index_contains(self): + self.key in self.ci + + def time_categorical_contains(self): + self.key in self.c + + +class CategoricalSlicing(object): + + goal_time = 0.2 + params = 
['monotonic_incr', 'monotonic_decr', 'non_monotonic'] + param_names = ['index'] + + def setup(self, index): + N = 10**6 + values = list('a' * N + 'b' * N + 'c' * N) + indices = { + 'monotonic_incr': pd.Categorical(values), + 'monotonic_decr': pd.Categorical(reversed(values)), + 'non_monotonic': pd.Categorical(list('abc' * N))} + self.data = indices[index] + + self.scalar = 10000 + self.list = list(range(10000)) + self.cat_scalar = 'b' + + def time_getitem_scalar(self, index): + self.data[self.scalar] + + def time_getitem_slice(self, index): + self.data[:self.scalar] + + def time_getitem_list_like(self, index): + self.data[[self.scalar]] + + def time_getitem_list(self, index): + self.data[self.list] + + def time_getitem_bool_array(self, index): + self.data[self.data == self.cat_scalar] diff --git a/asv_bench/benchmarks/ctors.py b/asv_bench/benchmarks/ctors.py index 265ffbc7261ca..3f9016787aab4 100644 --- a/asv_bench/benchmarks/ctors.py +++ b/asv_bench/benchmarks/ctors.py @@ -1,52 +1,66 @@ -from .pandas_vb_common import * +import numpy as np +import pandas.util.testing as tm +from pandas import Series, Index, DatetimeIndex, Timestamp, MultiIndex +from .pandas_vb_common import setup # noqa -class frame_constructor_ndarray(object): - goal_time = 0.2 - - def setup(self): - self.arr = np.random.randn(100, 100) - def time_frame_constructor_ndarray(self): - DataFrame(self.arr) +class SeriesConstructors(object): - -class ctor_index_array_string(object): goal_time = 0.2 - def setup(self): - self.data = np.array(['foo', 'bar', 'baz'], dtype=object) + param_names = ["data_fmt", "with_index"] + params = [[lambda x: x, + list, + lambda arr: list(arr.astype(str)), + lambda arr: dict(zip(range(len(arr)), arr)), + lambda arr: [(i, -i) for i in arr], + lambda arr: [[i, -i] for i in arr], + lambda arr: ([(i, -i) for i in arr][:-1] + [None]), + lambda arr: ([[i, -i] for i in arr][:-1] + [None])], + [False, True]] + + def setup(self, data_fmt, with_index): + N = 10**4 + arr = np.random.randn(N) + self.data = data_fmt(arr) + self.index = np.arange(N) if with_index else None + + def time_series_constructor(self, data_fmt, with_index): + Series(self.data, index=self.index) - def time_ctor_index_array_string(self): - Index(self.data) +class SeriesDtypesConstructors(object): -class series_constructor_ndarray(object): goal_time = 0.2 def setup(self): - self.data = np.random.randn(100) - self.index = Index(np.arange(100)) + N = 10**4 + self.arr = np.random.randn(N, N) + self.arr_str = np.array(['foo', 'bar', 'baz'], dtype=object) + self.s = Series([Timestamp('20110101'), Timestamp('20120101'), + Timestamp('20130101')] * N * 10) - def time_series_constructor_ndarray(self): - Series(self.data, index=self.index) + def time_index_from_array_string(self): + Index(self.arr_str) + def time_index_from_array_floats(self): + Index(self.arr) -class dtindex_from_series_ctor(object): - goal_time = 0.2 + def time_dtindex_from_series(self): + DatetimeIndex(self.s) - def setup(self): - self.s = Series(([Timestamp('20110101'), Timestamp('20120101'), Timestamp('20130101')] * 1000)) + def time_dtindex_from_index_with_series(self): + Index(self.s) - def time_dtindex_from_series_ctor(self): - DatetimeIndex(self.s) +class MultiIndexConstructor(object): -class index_from_series_ctor(object): goal_time = 0.2 def setup(self): - self.s = Series(([Timestamp('20110101'), Timestamp('20120101'), Timestamp('20130101')] * 1000)) + N = 10**4 + self.iterables = [tm.makeStringIndex(N), range(20)] - def time_index_from_series_ctor(self): - 
Index(self.s) \ No newline at end of file + def time_multiindex_from_iterables(self): + MultiIndex.from_product(self.iterables) diff --git a/asv_bench/benchmarks/eval.py b/asv_bench/benchmarks/eval.py index 719d92567a7be..8e581dcf22b4c 100644 --- a/asv_bench/benchmarks/eval.py +++ b/asv_bench/benchmarks/eval.py @@ -1,239 +1,67 @@ -from .pandas_vb_common import * +import numpy as np import pandas as pd -import pandas.computation.expressions as expr +try: + import pandas.core.computation.expressions as expr +except ImportError: + import pandas.computation.expressions as expr +from .pandas_vb_common import setup # noqa -class eval_frame_add_all_threads(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - - def time_eval_frame_add_all_threads(self): - pd.eval('df + df2 + df3 + df4') - - -class eval_frame_add_one_thread(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - expr.set_numexpr_threads(1) - - def time_eval_frame_add_one_thread(self): - pd.eval('df + df2 + df3 + df4') - - -class eval_frame_add_python(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - - def time_eval_frame_add_python(self): - pd.eval('df + df2 + df3 + df4', engine='python') - - -class eval_frame_add_python_one_thread(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - expr.set_numexpr_threads(1) - - def time_eval_frame_add_python_one_thread(self): - pd.eval('df + df2 + df3 + df4', engine='python') - - -class eval_frame_and_all_threads(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - - def time_eval_frame_and_all_threads(self): - pd.eval('(df > 0) & (df2 > 0) & (df3 > 0) & (df4 > 0)') - - -class eval_frame_and_python_one_thread(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - expr.set_numexpr_threads(1) - - def time_eval_frame_and_python_one_thread(self): - pd.eval('(df > 0) & (df2 > 0) & (df3 > 0) & (df4 > 0)', engine='python') - - -class eval_frame_and_python(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - - def time_eval_frame_and_python(self): - pd.eval('(df > 0) & (df2 > 0) & (df3 > 0) & (df4 > 0)', engine='python') +class Eval(object): -class eval_frame_chained_cmp_all_threads(object): goal_time = 
0.2 - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - - def time_eval_frame_chained_cmp_all_threads(self): - pd.eval('df < df2 < df3 < df4') - - -class eval_frame_chained_cmp_python_one_thread(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - expr.set_numexpr_threads(1) - - def time_eval_frame_chained_cmp_python_one_thread(self): - pd.eval('df < df2 < df3 < df4', engine='python') - - -class eval_frame_chained_cmp_python(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - - def time_eval_frame_chained_cmp_python(self): - pd.eval('df < df2 < df3 < df4', engine='python') - - -class eval_frame_mult_all_threads(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - - def time_eval_frame_mult_all_threads(self): - pd.eval('df * df2 * df3 * df4') + params = [['numexpr', 'python'], [1, 'all']] + param_names = ['engine', 'threads'] + def setup(self, engine, threads): + self.df = pd.DataFrame(np.random.randn(20000, 100)) + self.df2 = pd.DataFrame(np.random.randn(20000, 100)) + self.df3 = pd.DataFrame(np.random.randn(20000, 100)) + self.df4 = pd.DataFrame(np.random.randn(20000, 100)) -class eval_frame_mult_one_thread(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - expr.set_numexpr_threads(1) - - def time_eval_frame_mult_one_thread(self): - pd.eval('df * df2 * df3 * df4') - + if threads == 1: + expr.set_numexpr_threads(1) -class eval_frame_mult_python(object): - goal_time = 0.2 + def time_add(self, engine, threads): + pd.eval('self.df + self.df2 + self.df3 + self.df4', engine=engine) - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) + def time_and(self, engine, threads): + pd.eval('(self.df > 0) & (self.df2 > 0) & ' + '(self.df3 > 0) & (self.df4 > 0)', engine=engine) - def time_eval_frame_mult_python(self): - pd.eval('df * df2 * df3 * df4', engine='python') + def time_chained_cmp(self, engine, threads): + pd.eval('self.df < self.df2 < self.df3 < self.df4', engine=engine) + def time_mult(self, engine, threads): + pd.eval('self.df * self.df2 * self.df3 * self.df4', engine=engine) -class eval_frame_mult_python_one_thread(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) - expr.set_numexpr_threads(1) + def teardown(self, engine, threads): + 
expr.set_numexpr_threads() - def time_eval_frame_mult_python_one_thread(self): - pd.eval('df * df2 * df3 * df4', engine='python') +class Query(object): -class query_datetime_index(object): goal_time = 0.2 def setup(self): - self.N = 1000000 - self.halfway = ((self.N // 2) - 1) - self.index = date_range('20010101', periods=self.N, freq='T') - self.s = Series(self.index) - self.ts = self.s.iloc[self.halfway] - self.df = DataFrame({'a': np.random.randn(self.N), }, index=self.index) + N = 10**6 + halfway = (N // 2) - 1 + index = pd.date_range('20010101', periods=N, freq='T') + s = pd.Series(index) + self.ts = s.iloc[halfway] + self.df = pd.DataFrame({'a': np.random.randn(N), 'dates': s}, + index=index) + data = np.random.randn(N) + self.min_val = data.min() + self.max_val = data.max() def time_query_datetime_index(self): - self.df.query('index < @ts') + self.df.query('index < @self.ts') - -class query_datetime_series(object): - goal_time = 0.2 - - def setup(self): - self.N = 1000000 - self.halfway = ((self.N // 2) - 1) - self.index = date_range('20010101', periods=self.N, freq='T') - self.s = Series(self.index) - self.ts = self.s.iloc[self.halfway] - self.df = DataFrame({'dates': self.s.values, }) - - def time_query_datetime_series(self): - self.df.query('dates < @ts') - - -class query_with_boolean_selection(object): - goal_time = 0.2 - - def setup(self): - self.N = 1000000 - self.halfway = ((self.N // 2) - 1) - self.index = date_range('20010101', periods=self.N, freq='T') - self.s = Series(self.index) - self.ts = self.s.iloc[self.halfway] - self.N = 1000000 - self.df = DataFrame({'a': np.random.randn(self.N), }) - self.min_val = self.df['a'].min() - self.max_val = self.df['a'].max() + def time_query_datetime_column(self): + self.df.query('dates < @self.ts') def time_query_with_boolean_selection(self): - self.df.query('(a >= @min_val) & (a <= @max_val)') \ No newline at end of file + self.df.query('(a >= @self.min_val) & (a <= @self.max_val)') diff --git a/asv_bench/benchmarks/frame_ctor.py b/asv_bench/benchmarks/frame_ctor.py index 85f3c1628bd8b..9def910df0bab 100644 --- a/asv_bench/benchmarks/frame_ctor.py +++ b/asv_bench/benchmarks/frame_ctor.py @@ -1,1706 +1,101 @@ -from .pandas_vb_common import * +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, Series, MultiIndex, Timestamp, date_range try: - from pandas.tseries.offsets import * -except: - from pandas.core.datetools import * + from pandas.tseries.offsets import Nano, Hour +except ImportError: + # For compatibility with older versions + from pandas.core.datetools import * # noqa - -class frame_ctor_dtindex_BDayx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BDay(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BDayx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BDayx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BDay(2, 
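The Query benchmarks above exercise the `@` prefix in DataFrame.query, which tells the expression engine to resolve a name from the surrounding Python scope (here the instance attributes `@self.ts`, `@self.min_val`, `@self.max_val`) rather than treating it as a column; bare names still refer to columns or the index. A self-contained illustration:

import numpy as np
import pandas as pd

df = pd.DataFrame({'a': np.random.randn(1000)},
                  index=pd.date_range('2001-01-01', periods=1000, freq='T'))
cutoff = df.index[499]
before = df.query('index < @cutoff')   # '@cutoff' is the local variable
assert len(before) == 499              # rows strictly before the cutoff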
**{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BDayx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BMonthBeginx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BMonthBegin(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BMonthBeginx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BMonthBeginx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BMonthBegin(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BMonthBeginx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BMonthEndx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BMonthEnd(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BMonthEndx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BMonthEndx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BMonthEnd(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BMonthEndx2(self): - DataFrame(self.d) - - def 
get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BQuarterBeginx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BQuarterBegin(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BQuarterBeginx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BQuarterBeginx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BQuarterBegin(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BQuarterBeginx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BQuarterEndx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BQuarterEnd(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BQuarterEndx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BQuarterEndx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BQuarterEnd(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BQuarterEndx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * 
((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BYearBeginx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BYearBegin(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BYearBeginx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BYearBeginx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BYearBegin(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BYearBeginx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BYearEndx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BYearEnd(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BYearEndx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BYearEndx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BYearEnd(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BYearEndx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, 
self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BusinessDayx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BusinessDay(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BusinessDayx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BusinessDayx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BusinessDay(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BusinessDayx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BusinessHourx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BusinessHour(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BusinessHourx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_BusinessHourx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(BusinessHour(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_BusinessHourx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_CBMonthBeginx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(CBMonthBegin(1, **{})) - 
self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_CBMonthBeginx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_CBMonthBeginx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(CBMonthBegin(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_CBMonthBeginx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_CBMonthEndx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(CBMonthEnd(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_CBMonthEndx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_CBMonthEndx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(CBMonthEnd(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_CBMonthEndx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_CDayx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(CDay(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_CDayx1(self): - DataFrame(self.d) - - def get_period_count(self, 
start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_CDayx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(CDay(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_CDayx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_CustomBusinessDayx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(CustomBusinessDay(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_CustomBusinessDayx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_CustomBusinessDayx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(CustomBusinessDay(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_CustomBusinessDayx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_DateOffsetx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(DateOffset(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_DateOffsetx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days 
// self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_DateOffsetx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(DateOffset(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_DateOffsetx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Dayx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Day(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Dayx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Dayx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Day(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Dayx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Easterx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Easter(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Easterx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Easterx2(object): - 
goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Easter(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Easterx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_FY5253Quarterx1__variation_last(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(FY5253Quarter(1, **{'startingMonth': 1, 'qtr_with_extra_week': 1, 'weekday': 1, 'variation': 'last', })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_FY5253Quarterx1__variation_last(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_FY5253Quarterx1__variation_nearest(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(FY5253Quarter(1, **{'startingMonth': 1, 'qtr_with_extra_week': 1, 'weekday': 1, 'variation': 'nearest', })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_FY5253Quarterx1__variation_nearest(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_FY5253Quarterx2__variation_last(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(FY5253Quarter(2, **{'startingMonth': 1, 'qtr_with_extra_week': 1, 'weekday': 1, 'variation': 'last', })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_FY5253Quarterx2__variation_last(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return 
date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_FY5253Quarterx2__variation_nearest(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(FY5253Quarter(2, **{'startingMonth': 1, 'qtr_with_extra_week': 1, 'weekday': 1, 'variation': 'nearest', })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_FY5253Quarterx2__variation_nearest(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_FY5253x1__variation_last(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(FY5253(1, **{'startingMonth': 1, 'weekday': 1, 'variation': 'last', })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_FY5253x1__variation_last(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_FY5253x1__variation_nearest(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(FY5253(1, **{'startingMonth': 1, 'weekday': 1, 'variation': 'nearest', })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_FY5253x1__variation_nearest(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_FY5253x2__variation_last(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(FY5253(2, **{'startingMonth': 1, 'weekday': 1, 'variation': 'last', })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_FY5253x2__variation_last(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - 
start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_FY5253x2__variation_nearest(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(FY5253(2, **{'startingMonth': 1, 'weekday': 1, 'variation': 'nearest', })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_FY5253x2__variation_nearest(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Hourx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Hour(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Hourx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Hourx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Hour(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Hourx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_LastWeekOfMonthx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(LastWeekOfMonth(1, **{'week': 1, 'weekday': 1, })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_LastWeekOfMonthx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - 
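Each of the several dozen frame_ctor_dtindex_* classes removed in this file carried verbatim copies of the same two helpers. For reference, the duplicated logic amounts to this single module-level pair (a cleaned-up restatement with comments, not code from the patch itself):

from pandas import Timestamp, date_range

def get_period_count(start_date, off):
    # Days covered by ten applications of the offset; zero means the
    # offset is sub-daily, so the full 1000 periods always fit.
    ten_offsets_in_days = ((start_date + off * 10) - start_date).days
    if ten_offsets_in_days == 0:
        return 1000
    # Otherwise cap the count (with a safety factor) so the resulting
    # index cannot run past Timestamp.max; never request more than 1000.
    max_periods = 9 * ((Timestamp.max - start_date).days //
                       ten_offsets_in_days)
    return min(max_periods, 1000)

def get_index_for_offset(off):
    start_date = Timestamp('1/1/1900')
    return date_range(start_date,
                      periods=min(1000, get_period_count(start_date, off)),
                      freq=off)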
return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) +from .pandas_vb_common import setup # noqa -class frame_ctor_dtindex_LastWeekOfMonthx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(LastWeekOfMonth(2, **{'week': 1, 'weekday': 1, })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_LastWeekOfMonthx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Microx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Micro(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Microx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Microx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Micro(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Microx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Millix1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Milli(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Millix1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Millix2(object): - goal_time = 0.2 - - def setup(self): 
- self.idx = self.get_index_for_offset(Milli(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Millix2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Minutex1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Minute(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Minutex1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Minutex2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Minute(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Minutex2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_MonthBeginx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(MonthBegin(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_MonthBeginx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_MonthBeginx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(MonthBegin(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_MonthBeginx2(self): - 
DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_MonthEndx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(MonthEnd(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_MonthEndx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_MonthEndx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(MonthEnd(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_MonthEndx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Nanox1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Nano(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Nanox1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Nanox2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Nano(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Nanox2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // 
self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_QuarterBeginx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(QuarterBegin(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_QuarterBeginx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_QuarterBeginx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(QuarterBegin(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_QuarterBeginx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_QuarterEndx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(QuarterEnd(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_QuarterEndx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_QuarterEndx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(QuarterEnd(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_QuarterEndx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), 
freq=off) - - -class frame_ctor_dtindex_Secondx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Second(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Secondx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Secondx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Second(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Secondx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_WeekOfMonthx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(WeekOfMonth(1, **{'week': 1, 'weekday': 1, })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_WeekOfMonthx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_WeekOfMonthx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(WeekOfMonth(2, **{'week': 1, 'weekday': 1, })) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_WeekOfMonthx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Weekx1(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Week(1, **{})) - self.df = 
DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) +class FromDicts(object): - def time_frame_ctor_dtindex_Weekx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_Weekx2(object): - goal_time = 0.2 - - def setup(self): - self.idx = self.get_index_for_offset(Week(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_Weekx2(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_dtindex_YearBeginx1(object): goal_time = 0.2 def setup(self): - self.idx = self.get_index_for_offset(YearBegin(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_YearBeginx1(self): - DataFrame(self.d) - - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) + N, K = 5000, 50 + self.index = tm.makeStringIndex(N) + self.columns = tm.makeStringIndex(K) + frame = DataFrame(np.random.randn(N, K), index=self.index, + columns=self.columns) + self.data = frame.to_dict() + self.dict_list = frame.to_dict(orient='records') + self.data2 = {i: {j: float(j) for j in range(100)} + for i in range(2000)} + + def time_list_of_dict(self): + DataFrame(self.dict_list) + def time_nested_dict(self): + DataFrame(self.data) -class frame_ctor_dtindex_YearBeginx2(object): - goal_time = 0.2 + def time_nested_dict_index(self): + DataFrame(self.data, index=self.index) - def setup(self): - self.idx = self.get_index_for_offset(YearBegin(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) + def time_nested_dict_columns(self): + DataFrame(self.data, columns=self.columns) - def time_frame_ctor_dtindex_YearBeginx2(self): - DataFrame(self.d) + def time_nested_dict_index_columns(self): + DataFrame(self.data, index=self.index, columns=self.columns) - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - 
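The FromDicts benchmarks above time the DataFrame constructor on the two dict shapes produced in setup: to_dict() returns a nested {column: {index: value}} mapping, while to_dict(orient='records') returns one dict per row. On a tiny frame:

from pandas import DataFrame

frame = DataFrame({'a': [1, 2], 'b': [3, 4]}, index=['x', 'y'])
nested = frame.to_dict()                    # {'a': {'x': 1, 'y': 2}, ...}
records = frame.to_dict(orient='records')   # [{'a': 1, 'b': 3}, ...]
# Both shapes round-trip through the constructor (records drop the index).
assert DataFrame(nested).shape == frame.shape
assert DataFrame(records).shape == frame.shape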
return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) + def time_nested_dict_int64(self): + # nested dict, integer indexes, regression described in #621 + DataFrame(self.data2) - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) +class FromSeries(object): -class frame_ctor_dtindex_YearEndx1(object): goal_time = 0.2 def setup(self): - self.idx = self.get_index_for_offset(YearEnd(1, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - - def time_frame_ctor_dtindex_YearEndx1(self): - DataFrame(self.d) + mi = MultiIndex.from_product([range(100), range(100)]) + self.s = Series(np.random.randn(10000), index=mi) - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) + def time_mi_series(self): + DataFrame(self.s) - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) +class FromDictwithTimestamp(object): -class frame_ctor_dtindex_YearEndx2(object): goal_time = 0.2 + params = [Nano(1), Hour(1)] + param_names = ['offset'] - def setup(self): - self.idx = self.get_index_for_offset(YearEnd(2, **{})) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) + def setup(self, offset): + N = 10**3 + np.random.seed(1234) + idx = date_range(Timestamp('1/1/1900'), freq=offset, periods=N) + df = DataFrame(np.random.randn(N, 10), index=idx) + self.d = df.to_dict() - def time_frame_ctor_dtindex_YearEndx2(self): + def time_dict_with_timestamp_offsets(self, offset): DataFrame(self.d) - def get_period_count(self, start_date, off): - self.ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (self.ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // self.ten_offsets_in_days)), 1000) - - def get_index_for_offset(self, off): - self.start_date = Timestamp('1/1/1900') - return date_range(self.start_date, periods=min(1000, self.get_period_count(self.start_date, off)), freq=off) - - -class frame_ctor_list_of_dict(object): - goal_time = 0.2 - - def setup(self): - (N, K) = (5000, 50) - self.index = tm.makeStringIndex(N) - self.columns = tm.makeStringIndex(K) - self.frame = DataFrame(np.random.randn(N, K), index=self.index, columns=self.columns) - try: - self.data = self.frame.to_dict() - except: - self.data = self.frame.toDict() - self.some_dict = self.data.values()[0] - self.dict_list = [dict(zip(self.columns, row)) for row in self.frame.values] - - def time_frame_ctor_list_of_dict(self): - DataFrame(self.dict_list) - - -class frame_ctor_nested_dict(object): - goal_time = 0.2 - - def setup(self): - (N, K) = (5000, 50) - self.index = tm.makeStringIndex(N) - self.columns = tm.makeStringIndex(K) - self.frame = DataFrame(np.random.randn(N, K), index=self.index, columns=self.columns) - try: - self.data = self.frame.to_dict() - except: - self.data = self.frame.toDict() - self.some_dict = self.data.values()[0] - self.dict_list = 
[dict(zip(self.columns, row)) for row in self.frame.values] - - def time_frame_ctor_nested_dict(self): - DataFrame(self.data) +class FromRecords(object): -class frame_ctor_nested_dict_int64(object): goal_time = 0.2 + params = [None, 1000] + param_names = ['nrows'] - def setup(self): - self.data = dict(((i, dict(((j, float(j)) for j in range(100)))) for i in xrange(2000))) - - def time_frame_ctor_nested_dict_int64(self): - DataFrame(self.data) - - -class frame_from_series(object): - goal_time = 0.2 - - def setup(self): - self.mi = MultiIndex.from_tuples([(x, y) for x in range(100) for y in range(100)]) - self.s = Series(randn(10000), index=self.mi) + def setup(self, nrows): + N = 100000 + self.gen = ((x, (x * 20), (x * 100)) for x in range(N)) - def time_frame_from_series(self): - DataFrame(self.s) - - -class frame_get_numeric_data(object): - goal_time = 0.2 + def time_frame_from_records_generator(self, nrows): + # issue-6700 + self.df = DataFrame.from_records(self.gen, nrows=nrows) - def setup(self): - self.df = DataFrame(randn(10000, 25)) - self.df['foo'] = 'bar' - self.df['bar'] = 'baz' - self.df = self.df.consolidate() - - def time_frame_get_numeric_data(self): - self.df._get_numeric_data() +class FromNDArray(object): -class series_ctor_from_dict(object): goal_time = 0.2 def setup(self): - (N, K) = (5000, 50) - self.index = tm.makeStringIndex(N) - self.columns = tm.makeStringIndex(K) - self.frame = DataFrame(np.random.randn(N, K), index=self.index, columns=self.columns) - try: - self.data = self.frame.to_dict() - except: - self.data = self.frame.toDict() - self.some_dict = self.data.values()[0] - self.dict_list = [dict(zip(self.columns, row)) for row in self.frame.values] + N = 100000 + self.data = np.random.randn(N) - def time_series_ctor_from_dict(self): - Series(self.some_dict) \ No newline at end of file + def time_frame_from_ndarray(self): + self.df = DataFrame(self.data) diff --git a/asv_bench/benchmarks/frame_methods.py b/asv_bench/benchmarks/frame_methods.py index a04a9d0814a30..1819cfa2725db 100644 --- a/asv_bench/benchmarks/frame_methods.py +++ b/asv_bench/benchmarks/frame_methods.py @@ -1,950 +1,532 @@ -from .pandas_vb_common import * +import string +import warnings +import numpy as np +import pandas.util.testing as tm +from pandas import (DataFrame, Series, MultiIndex, date_range, period_range, + isnull, NaT) -class frame_apply_axis_1(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 100)) - - def time_frame_apply_axis_1(self): - self.df.apply((lambda x: (x + 1)), axis=1) - +from .pandas_vb_common import setup # noqa -class frame_apply_lambda_mean(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 100)) - - def time_frame_apply_lambda_mean(self): - self.df.apply((lambda x: x.sum())) +class GetNumericData(object): -class frame_apply_np_mean(object): goal_time = 0.2 def setup(self): - self.df = DataFrame(np.random.randn(1000, 100)) - - def time_frame_apply_np_mean(self): - self.df.apply(np.mean) - - -class frame_apply_pass_thru(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 100)) - - def time_frame_apply_pass_thru(self): - self.df.apply((lambda x: x)) - - -class frame_apply_ref_by_name(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 3), columns=list('ABC')) - - def time_frame_apply_ref_by_name(self): - self.df.apply((lambda x: (x['A'] + x['B'])), axis=1) - - -class frame_apply_user_func(object): - goal_time 
= 0.2 - - def setup(self): - self.s = Series(np.arange(1028.0)) - self.df = DataFrame({i: self.s for i in range(1028)}) - - def time_frame_apply_user_func(self): - self.df.apply((lambda x: np.corrcoef(x, self.s)[(0, 1)])) - - -class frame_assign_timeseries_index(object): - goal_time = 0.2 - - def setup(self): - self.idx = date_range('1/1/2000', periods=100000, freq='D') - self.df = DataFrame(randn(100000, 1), columns=['A'], index=self.idx) - - def time_frame_assign_timeseries_index(self): - self.f(self.df) - - def f(self, df): - self.x = self.df.copy() - self.x['date'] = self.x.index - - -class frame_boolean_row_select(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(randn(10000, 100)) - self.bool_arr = np.zeros(10000, dtype=bool) - self.bool_arr[:1000] = True - - def time_frame_boolean_row_select(self): - self.df[self.bool_arr] - - -class frame_count_level_axis0_mixed_dtypes_multi(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - self.df['foo'] = 'bar' - self.df.index = MultiIndex.from_tuples(self.df.index.map((lambda x: (x, x)))) - self.df.columns = MultiIndex.from_tuples(self.df.columns.map((lambda x: (x, x)))) - - def time_frame_count_level_axis0_mixed_dtypes_multi(self): - self.df.count(axis=0, level=1) - - -class frame_count_level_axis0_multi(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - self.df.index = MultiIndex.from_tuples(self.df.index.map((lambda x: (x, x)))) - self.df.columns = MultiIndex.from_tuples(self.df.columns.map((lambda x: (x, x)))) - - def time_frame_count_level_axis0_multi(self): - self.df.count(axis=0, level=1) - - -class frame_count_level_axis1_mixed_dtypes_multi(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan + self.df = DataFrame(np.random.randn(10000, 25)) self.df['foo'] = 'bar' - self.df.index = MultiIndex.from_tuples(self.df.index.map((lambda x: (x, x)))) - self.df.columns = MultiIndex.from_tuples(self.df.columns.map((lambda x: (x, x)))) - - def time_frame_count_level_axis1_mixed_dtypes_multi(self): - self.df.count(axis=1, level=1) - - -class frame_count_level_axis1_multi(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - self.df.index = MultiIndex.from_tuples(self.df.index.map((lambda x: (x, x)))) - self.df.columns = MultiIndex.from_tuples(self.df.columns.map((lambda x: (x, x)))) - - def time_frame_count_level_axis1_multi(self): - self.df.count(axis=1, level=1) - - -class frame_dropna_axis0_all(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - - def time_frame_dropna_axis0_all(self): - self.df.dropna(how='all', axis=0) - - -class frame_dropna_axis0_all_mixed_dtypes(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - 
self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - self.df['foo'] = 'bar' - - def time_frame_dropna_axis0_all_mixed_dtypes(self): - self.df.dropna(how='all', axis=0) - - -class frame_dropna_axis0_any(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - - def time_frame_dropna_axis0_any(self): - self.df.dropna(how='any', axis=0) - - -class frame_dropna_axis0_any_mixed_dtypes(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - self.df['foo'] = 'bar' - - def time_frame_dropna_axis0_any_mixed_dtypes(self): - self.df.dropna(how='any', axis=0) - - -class frame_dropna_axis1_all(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - - def time_frame_dropna_axis1_all(self): - self.df.dropna(how='all', axis=1) - - -class frame_dropna_axis1_all_mixed_dtypes(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - self.df['foo'] = 'bar' - - def time_frame_dropna_axis1_all_mixed_dtypes(self): - self.df.dropna(how='all', axis=1) - - -class frame_dropna_axis1_any(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - - def time_frame_dropna_axis1_any(self): - self.df.dropna(how='any', axis=1) - - -class frame_dropna_axis1_any_mixed_dtypes(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) - self.df.ix[50:1000, 20:50] = np.nan - self.df.ix[2000:3000] = np.nan - self.df.ix[:, 60:70] = np.nan - self.df['foo'] = 'bar' - - def time_frame_dropna_axis1_any_mixed_dtypes(self): - self.df.dropna(how='any', axis=1) - - -class frame_dtypes(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 1000)) - - def time_frame_dtypes(self): - self.df.dtypes - - -class frame_duplicated(object): - goal_time = 0.2 - - def setup(self): - self.n = (1 << 20) - self.t = date_range('2015-01-01', freq='S', periods=(self.n // 64)) - self.xs = np.random.randn((self.n // 64)).round(2) - self.df = DataFrame({'a': np.random.randint(((-1) << 8), (1 << 8), self.n), 'b': np.random.choice(self.t, self.n), 'c': np.random.choice(self.xs, self.n), }) - - def time_frame_duplicated(self): - self.df.duplicated() + self.df['bar'] = 'baz' + with warnings.catch_warnings(record=True): + self.df = self.df.consolidate() -class frame_duplicated_wide(object): - goal_time = 0.2 + def time_frame_get_numeric_data(self): + self.df._get_numeric_data() - def setup(self): - self.df = DataFrame(np.random.randn(1000, 100).astype(str)) - def time_frame_duplicated_wide(self): - self.df.T.duplicated() +class Lookup(object): -class frame_fancy_lookup(object): goal_time = 0.2 def setup(self): - self.df = 
DataFrame(np.random.randn(10000, 8), columns=list('abcdefgh')) + self.df = DataFrame(np.random.randn(10000, 8), + columns=list('abcdefgh')) self.df['foo'] = 'bar' self.row_labels = list(self.df.index[::10])[:900] - self.col_labels = (list(self.df.columns) * 100) - self.row_labels_all = np.array((list(self.df.index) * len(self.df.columns)), dtype='object') - self.col_labels_all = np.array((list(self.df.columns) * len(self.df.index)), dtype='object') + self.col_labels = list(self.df.columns) * 100 + self.row_labels_all = np.array( + list(self.df.index) * len(self.df.columns), dtype='object') + self.col_labels_all = np.array( + list(self.df.columns) * len(self.df.index), dtype='object') def time_frame_fancy_lookup(self): self.df.lookup(self.row_labels, self.col_labels) - -class frame_fancy_lookup_all(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(10000, 8), columns=list('abcdefgh')) - self.df['foo'] = 'bar' - self.row_labels = list(self.df.index[::10])[:900] - self.col_labels = (list(self.df.columns) * 100) - self.row_labels_all = np.array((list(self.df.index) * len(self.df.columns)), dtype='object') - self.col_labels_all = np.array((list(self.df.columns) * len(self.df.index)), dtype='object') - def time_frame_fancy_lookup_all(self): self.df.lookup(self.row_labels_all, self.col_labels_all) -class frame_fillna_inplace(object): - goal_time = 0.2 +class Reindex(object): - def setup(self): - self.df = DataFrame(randn(10000, 100)) - self.df.values[::2] = np.nan - - def time_frame_fillna_inplace(self): - self.df.fillna(0, inplace=True) - - -class frame_float_equal(object): goal_time = 0.2 def setup(self): - self.float_df = DataFrame(np.random.randn(1000, 1000)) - self.object_df = DataFrame(([(['foo'] * 1000)] * 1000)) - self.nonunique_cols = self.object_df.copy() - self.nonunique_cols.columns = (['A'] * len(self.nonunique_cols.columns)) - self.pairs = dict([(name, self.make_pair(frame)) for (name, frame) in (('float_df', self.float_df), ('object_df', self.object_df), ('nonunique_cols', self.nonunique_cols))]) - - def time_frame_float_equal(self): - self.test_equal('float_df') - - def make_pair(self, frame): - self.df = frame - self.df2 = self.df.copy() - self.df2.ix[((-1), (-1))] = np.nan - return (self.df, self.df2) - - def test_equal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df) - - def test_unequal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df2) + N = 10**3 + self.df = DataFrame(np.random.randn(N * 10, N)) + self.idx = np.arange(4 * N, 7 * N) + self.df2 = DataFrame( + {c: {0: np.random.randint(0, 2, N).astype(np.bool_), + 1: np.random.randint(0, N, N).astype(np.int16), + 2: np.random.randint(0, N, N).astype(np.int32), + 3: np.random.randint(0, N, N).astype(np.int64)} + [np.random.randint(0, 4)] for c in range(N)}) + def time_reindex_axis0(self): + self.df.reindex(self.idx) -class frame_float_unequal(object): - goal_time = 0.2 - - def setup(self): - self.float_df = DataFrame(np.random.randn(1000, 1000)) - self.object_df = DataFrame(([(['foo'] * 1000)] * 1000)) - self.nonunique_cols = self.object_df.copy() - self.nonunique_cols.columns = (['A'] * len(self.nonunique_cols.columns)) - self.pairs = dict([(name, self.make_pair(frame)) for (name, frame) in (('float_df', self.float_df), ('object_df', self.object_df), ('nonunique_cols', self.nonunique_cols))]) - - def time_frame_float_unequal(self): - self.test_unequal('float_df') - - def make_pair(self, frame): - self.df = frame - 
self.df2 = self.df.copy() - self.df2.ix[((-1), (-1))] = np.nan - return (self.df, self.df2) - - def test_equal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df) - - def test_unequal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df2) - - -class frame_from_records_generator(object): - goal_time = 0.2 - - def time_frame_from_records_generator(self): - self.df = DataFrame.from_records(self.get_data()) + def time_reindex_axis1(self): + self.df.reindex(columns=self.idx) - def get_data(self, n=100000): - return ((x, (x * 20), (x * 100)) for x in range(n)) + def time_reindex_both_axes(self): + self.df.reindex(index=self.idx, columns=self.idx) + def time_reindex_both_axes_ix(self): + self.df.ix[self.idx, self.idx] -class frame_from_records_generator_nrows(object): - goal_time = 0.2 + def time_reindex_upcast(self): + self.df2.reindex(np.random.permutation(range(1200))) - def time_frame_from_records_generator_nrows(self): - self.df = DataFrame.from_records(self.get_data(), nrows=1000) - def get_data(self, n=100000): - return ((x, (x * 20), (x * 100)) for x in range(n)) +class Iteration(object): - -class frame_get_dtype_counts(object): goal_time = 0.2 def setup(self): - self.df = pandas.DataFrame(np.random.randn(10, 10000)) - - def time_frame_get_dtype_counts(self): - self.df.get_dtype_counts() - + N = 1000 + self.df = DataFrame(np.random.randn(N * 10, N)) + self.df2 = DataFrame(np.random.randn(N * 50, 10)) + self.df3 = DataFrame(np.random.randn(N, 5 * N), + columns=['C' + str(c) for c in range(N * 5)]) -class frame_getitem_single_column(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(randn(10000, 1000)) - self.df2 = DataFrame(randn(3000, 1), columns=['A']) - self.df3 = DataFrame(randn(3000, 1)) - - def time_frame_getitem_single_column(self): - self.h() - - def f(self): + def time_iteritems(self): + # (monitor no-copying behaviour) if hasattr(self.df, '_item_cache'): self.df._item_cache.clear() - for (name, col) in self.df.iteritems(): + for name, col in self.df.iteritems(): pass - def g(self): - for (name, col) in self.df.iteritems(): + def time_iteritems_cached(self): + for name, col in self.df.iteritems(): pass - def h(self): - for i in range(10000): - self.df2['A'] - - def j(self): - for i in range(10000): - self.df3[0] - - -class frame_getitem_single_column2(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(randn(10000, 1000)) - self.df2 = DataFrame(randn(3000, 1), columns=['A']) - self.df3 = DataFrame(randn(3000, 1)) - - def time_frame_getitem_single_column2(self): - self.j() + def time_iteritems_indexing(self): + for col in self.df3: + self.df3[col] - def f(self): - if hasattr(self.df, '_item_cache'): - self.df._item_cache.clear() - for (name, col) in self.df.iteritems(): + def time_itertuples(self): + for row in self.df2.itertuples(): pass - def g(self): - for (name, col) in self.df.iteritems(): + def time_iterrows(self): + for row in self.df.iterrows(): pass - def h(self): - for i in range(10000): - self.df2['A'] - def j(self): - for i in range(10000): - self.df3[0] +class ToString(object): - -class frame_html_repr_trunc_mi(object): goal_time = 0.2 def setup(self): - self.nrows = 10000 - self.data = randn(self.nrows, 10) - self.idx = MultiIndex.from_arrays(np.tile(randn(3, (self.nrows / 100)), 100)) - self.df = DataFrame(self.data, index=self.idx) - - def time_frame_html_repr_trunc_mi(self): - self.df._repr_html_() - + self.df = DataFrame(np.random.randn(100, 10)) -class 
frame_html_repr_trunc_si(object): - goal_time = 0.2 - - def setup(self): - self.nrows = 10000 - self.data = randn(self.nrows, 10) - self.idx = randn(self.nrows) - self.df = DataFrame(self.data, index=self.idx) + def time_to_string_floats(self): + self.df.to_string() - def time_frame_html_repr_trunc_si(self): - self.df._repr_html_() +class ToHTML(object): -class frame_insert_100_columns_begin(object): goal_time = 0.2 def setup(self): - self.N = 1000 + nrows = 500 + self.df2 = DataFrame(np.random.randn(nrows, 10)) + self.df2[0] = period_range('2000', periods=nrows) + self.df2[1] = range(nrows) - def time_frame_insert_100_columns_begin(self): - self.f() + def time_to_html_mixed(self): + self.df2.to_html() - def f(self, K=100): - self.df = DataFrame(index=range(self.N)) - self.new_col = np.random.randn(self.N) - for i in range(K): - self.df.insert(0, i, self.new_col) +class Repr(object): -class frame_insert_500_columns_end(object): goal_time = 0.2 def setup(self): - self.N = 1000 - - def time_frame_insert_500_columns_end(self): - self.f() + nrows = 10000 + data = np.random.randn(nrows, 10) + arrays = np.tile(np.random.randn(3, int(nrows / 100)), 100) + idx = MultiIndex.from_arrays(arrays) + self.df3 = DataFrame(data, index=idx) + self.df4 = DataFrame(data, index=np.random.randn(nrows)) + self.df_tall = DataFrame(np.random.randn(nrows, 10)) + self.df_wide = DataFrame(np.random.randn(10, nrows)) - def f(self, K=500): - self.df = DataFrame(index=range(self.N)) - self.new_col = np.random.randn(self.N) - for i in range(K): - self.df[i] = self.new_col + def time_html_repr_trunc_mi(self): + self.df3._repr_html_() + def time_html_repr_trunc_si(self): + self.df4._repr_html_() -class frame_interpolate(object): - goal_time = 0.2 + def time_repr_tall(self): + repr(self.df_tall) - def setup(self): - self.df = DataFrame(randn(10000, 100)) - self.df.values[::2] = np.nan + def time_frame_repr_wide(self): + repr(self.df_wide) - def time_frame_interpolate(self): - self.df.interpolate() +class MaskBool(object): -class frame_interpolate_some_good(object): goal_time = 0.2 def setup(self): - self.df = DataFrame({'A': np.arange(0, 10000), 'B': np.random.randint(0, 100, 10000), 'C': randn(10000), 'D': randn(10000), }) - self.df.loc[1::5, 'A'] = np.nan - self.df.loc[1::5, 'C'] = np.nan + data = np.random.randn(1000, 500) + df = DataFrame(data) + df = df.where(df > 0) + self.bools = df > 0 + self.mask = isnull(df) - def time_frame_interpolate_some_good(self): - self.df.interpolate() + def time_frame_mask_bools(self): + self.bools.mask(self.mask) + + def time_frame_mask_floats(self): + self.bools.astype(float).mask(self.mask) -class frame_interpolate_some_good_infer(object): +class Isnull(object): + goal_time = 0.2 def setup(self): - self.df = DataFrame({'A': np.arange(0, 10000), 'B': np.random.randint(0, 100, 10000), 'C': randn(10000), 'D': randn(10000), }) - self.df.loc[1::5, 'A'] = np.nan - self.df.loc[1::5, 'C'] = np.nan + N = 10**3 + self.df_no_null = DataFrame(np.random.randn(N, N)) - def time_frame_interpolate_some_good_infer(self): - self.df.interpolate(downcast='infer') + sample = np.array([np.nan, 1.0]) + data = np.random.choice(sample, (N, N)) + self.df = DataFrame(data) + sample = np.array(list(string.ascii_letters + string.whitespace)) + data = np.random.choice(sample, (N, N)) + self.df_strings = DataFrame(data) -class frame_isnull(object): - goal_time = 0.2 + sample = np.array([NaT, np.nan, None, np.datetime64('NaT'), + np.timedelta64('NaT'), 0, 1, 2.0, '', 'abcd']) + data = np.random.choice(sample, (N, 
N)) + self.df_obj = DataFrame(data) - def setup(self): - self.data = np.random.randn(1000, 1000) - self.df = DataFrame(self.data) + def time_isnull_floats_no_null(self): + isnull(self.df_no_null) - def time_frame_isnull(self): + def time_isnull(self): isnull(self.df) + def time_isnull_strings(self): + isnull(self.df_strings) -class frame_iteritems(object): - goal_time = 0.2 + def time_isnull_obj(self): + isnull(self.df_obj) - def setup(self): - self.df = DataFrame(randn(10000, 1000)) - self.df2 = DataFrame(randn(3000, 1), columns=['A']) - self.df3 = DataFrame(randn(3000, 1)) - def time_frame_iteritems(self): - self.f() +class Fillna(object): - def f(self): - if hasattr(self.df, '_item_cache'): - self.df._item_cache.clear() - for (name, col) in self.df.iteritems(): - pass + goal_time = 0.2 + params = ([True, False], ['pad', 'bfill']) + param_names = ['inplace', 'method'] - def g(self): - for (name, col) in self.df.iteritems(): - pass + def setup(self, inplace, method): + values = np.random.randn(10000, 100) + values[::2] = np.nan + self.df = DataFrame(values) - def h(self): - for i in range(10000): - self.df2['A'] + def time_frame_fillna(self, inplace, method): + self.df.fillna(inplace=inplace, method=method) - def j(self): - for i in range(10000): - self.df3[0] +class Dropna(object): -class frame_iteritems_cached(object): goal_time = 0.2 + params = (['all', 'any'], [0, 1]) + param_names = ['how', 'axis'] - def setup(self): - self.df = DataFrame(randn(10000, 1000)) - self.df2 = DataFrame(randn(3000, 1), columns=['A']) - self.df3 = DataFrame(randn(3000, 1)) - - def time_frame_iteritems_cached(self): - self.g() - - def f(self): - if hasattr(self.df, '_item_cache'): - self.df._item_cache.clear() - for (name, col) in self.df.iteritems(): - pass + def setup(self, how, axis): + self.df = DataFrame(np.random.randn(10000, 1000)) + self.df.ix[50:1000, 20:50] = np.nan + self.df.ix[2000:3000] = np.nan + self.df.ix[:, 60:70] = np.nan + self.df_mixed = self.df.copy() + self.df_mixed['foo'] = 'bar' - def g(self): - for (name, col) in self.df.iteritems(): - pass + def time_dropna(self, how, axis): + self.df.dropna(how=how, axis=axis) - def h(self): - for i in range(10000): - self.df2['A'] + def time_dropna_axis_mixed_dtypes(self, how, axis): + self.df_mixed.dropna(how=how, axis=axis) - def j(self): - for i in range(10000): - self.df3[0] +class Count(object): -class frame_mask_bools(object): goal_time = 0.2 - def setup(self): - self.data = np.random.randn(1000, 500) - self.df = DataFrame(self.data) - self.df = self.df.where((self.df > 0)) - self.bools = (self.df > 0) - self.mask = isnull(self.df) + params = [0, 1] + param_names = ['axis'] - def time_frame_mask_bools(self): - self.bools.mask(self.mask) + def setup(self, axis): + self.df = DataFrame(np.random.randn(10000, 1000)) + self.df.ix[50:1000, 20:50] = np.nan + self.df.ix[2000:3000] = np.nan + self.df.ix[:, 60:70] = np.nan + self.df_mixed = self.df.copy() + self.df_mixed['foo'] = 'bar' + self.df.index = MultiIndex.from_arrays([self.df.index, self.df.index]) + self.df.columns = MultiIndex.from_arrays([self.df.columns, + self.df.columns]) + self.df_mixed.index = MultiIndex.from_arrays([self.df_mixed.index, + self.df_mixed.index]) + self.df_mixed.columns = MultiIndex.from_arrays([self.df_mixed.columns, + self.df_mixed.columns]) -class frame_mask_floats(object): - goal_time = 0.2 + def time_count_level_multi(self, axis): + self.df.count(axis=axis, level=1) - def setup(self): - self.data = np.random.randn(1000, 500) - self.df = DataFrame(self.data) - 
self.df = self.df.where((self.df > 0)) - self.bools = (self.df > 0) - self.mask = isnull(self.df) + def time_count_level_mixed_dtypes_multi(self, axis): + self.df_mixed.count(axis=axis, level=1) - def time_frame_mask_floats(self): - self.bools.astype(float).mask(self.mask) +class Apply(object): -class frame_nonunique_equal(object): goal_time = 0.2 def setup(self): - self.float_df = DataFrame(np.random.randn(1000, 1000)) - self.object_df = DataFrame(([(['foo'] * 1000)] * 1000)) - self.nonunique_cols = self.object_df.copy() - self.nonunique_cols.columns = (['A'] * len(self.nonunique_cols.columns)) - self.pairs = dict([(name, self.make_pair(frame)) for (name, frame) in (('float_df', self.float_df), ('object_df', self.object_df), ('nonunique_cols', self.nonunique_cols))]) - - def time_frame_nonunique_equal(self): - self.test_equal('nonunique_cols') - - def make_pair(self, frame): - self.df = frame - self.df2 = self.df.copy() - self.df2.ix[((-1), (-1))] = np.nan - return (self.df, self.df2) - - def test_equal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df) + self.df = DataFrame(np.random.randn(1000, 100)) - def test_unequal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df2) + self.s = Series(np.arange(1028.0)) + self.df2 = DataFrame({i: self.s for i in range(1028)}) + self.df3 = DataFrame(np.random.randn(1000, 3), columns=list('ABC')) + def time_apply_user_func(self): + self.df2.apply(lambda x: np.corrcoef(x, self.s)[(0, 1)]) -class frame_nonunique_unequal(object): - goal_time = 0.2 + def time_apply_axis_1(self): + self.df.apply(lambda x: x + 1, axis=1) - def setup(self): - self.float_df = DataFrame(np.random.randn(1000, 1000)) - self.object_df = DataFrame(([(['foo'] * 1000)] * 1000)) - self.nonunique_cols = self.object_df.copy() - self.nonunique_cols.columns = (['A'] * len(self.nonunique_cols.columns)) - self.pairs = dict([(name, self.make_pair(frame)) for (name, frame) in (('float_df', self.float_df), ('object_df', self.object_df), ('nonunique_cols', self.nonunique_cols))]) + def time_apply_lambda_mean(self): + self.df.apply(lambda x: x.mean()) - def time_frame_nonunique_unequal(self): - self.test_unequal('nonunique_cols') + def time_apply_np_mean(self): + self.df.apply(np.mean) - def make_pair(self, frame): - self.df = frame - self.df2 = self.df.copy() - self.df2.ix[((-1), (-1))] = np.nan - return (self.df, self.df2) + def time_apply_pass_thru(self): + self.df.apply(lambda x: x) - def test_equal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df) + def time_apply_ref_by_name(self): + self.df3.apply(lambda x: x['A'] + x['B'], axis=1) - def test_unequal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df2) +class Dtypes(object): -class frame_object_equal(object): goal_time = 0.2 def setup(self): - self.float_df = DataFrame(np.random.randn(1000, 1000)) - self.object_df = DataFrame(([(['foo'] * 1000)] * 1000)) - self.nonunique_cols = self.object_df.copy() - self.nonunique_cols.columns = (['A'] * len(self.nonunique_cols.columns)) - self.pairs = dict([(name, self.make_pair(frame)) for (name, frame) in (('float_df', self.float_df), ('object_df', self.object_df), ('nonunique_cols', self.nonunique_cols))]) - - def time_frame_object_equal(self): - self.test_equal('object_df') - - def make_pair(self, frame): - self.df = frame - self.df2 = self.df.copy() - self.df2.ix[((-1), (-1))] = np.nan - return (self.df, self.df2) + self.df = 
DataFrame(np.random.randn(1000, 1000)) - def test_equal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df) + def time_frame_dtypes(self): + self.df.dtypes - def test_unequal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df2) +class Equals(object): -class frame_object_unequal(object): goal_time = 0.2 def setup(self): - self.float_df = DataFrame(np.random.randn(1000, 1000)) - self.object_df = DataFrame(([(['foo'] * 1000)] * 1000)) - self.nonunique_cols = self.object_df.copy() - self.nonunique_cols.columns = (['A'] * len(self.nonunique_cols.columns)) - self.pairs = dict([(name, self.make_pair(frame)) for (name, frame) in (('float_df', self.float_df), ('object_df', self.object_df), ('nonunique_cols', self.nonunique_cols))]) - - def time_frame_object_unequal(self): - self.test_unequal('object_df') + N = 10**3 + self.float_df = DataFrame(np.random.randn(N, N)) + self.float_df_nan = self.float_df.copy() + self.float_df_nan.iloc[-1, -1] = np.nan - def make_pair(self, frame): - self.df = frame - self.df2 = self.df.copy() - self.df2.ix[((-1), (-1))] = np.nan - return (self.df, self.df2) + self.object_df = DataFrame('foo', index=range(N), columns=range(N)) + self.object_df_nan = self.object_df.copy() + self.object_df_nan.iloc[-1, -1] = np.nan - def test_equal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df) + self.nonunique_cols = self.object_df.copy() + self.nonunique_cols.columns = ['A'] * len(self.nonunique_cols.columns) + self.nonunique_cols_nan = self.nonunique_cols.copy() + self.nonunique_cols_nan.iloc[-1, -1] = np.nan - def test_unequal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df2) + def time_frame_float_equal(self): + self.float_df.equals(self.float_df) + def time_frame_float_unequal(self): + self.float_df.equals(self.float_df_nan) -class frame_reindex_axis0(object): - goal_time = 0.2 + def time_frame_nonunique_equal(self): + self.nonunique_cols.equals(self.nonunique_cols) - def setup(self): - self.df = DataFrame(randn(10000, 10000)) - self.idx = np.arange(4000, 7000) + def time_frame_nonunique_unequal(self): + self.nonunique_cols.equals(self.nonunique_cols_nan) - def time_frame_reindex_axis0(self): - self.df.reindex(self.idx) + def time_frame_object_equal(self): + self.object_df.equals(self.object_df) + def time_frame_object_unequal(self): + self.object_df.equals(self.object_df_nan) -class frame_reindex_axis1(object): - goal_time = 0.2 - def setup(self): - self.df = DataFrame(randn(10000, 10000)) - self.idx = np.arange(4000, 7000) +class Interpolate(object): - def time_frame_reindex_axis1(self): - self.df.reindex(columns=self.idx) + goal_time = 0.2 + params = [None, 'infer'] + param_names = ['downcast'] + def setup(self, downcast): + N = 10000 + # this is the worst case, where every column has NaNs. 
+ self.df = DataFrame(np.random.randn(N, 100)) + self.df.values[::2] = np.nan -class frame_reindex_both_axes(object): - goal_time = 0.2 + self.df2 = DataFrame({'A': np.arange(0, N), + 'B': np.random.randint(0, 100, N), + 'C': np.random.randn(N), + 'D': np.random.randn(N)}) + self.df2.loc[1::5, 'A'] = np.nan + self.df2.loc[1::5, 'C'] = np.nan - def setup(self): - self.df = DataFrame(randn(10000, 10000)) - self.idx = np.arange(4000, 7000) + def time_interpolate(self, downcast): + self.df.interpolate(downcast=downcast) - def time_frame_reindex_both_axes(self): - self.df.reindex(index=self.idx, columns=self.idx) + def time_interpolate_some_good(self, downcast): + self.df2.interpolate(downcast=downcast) -class frame_reindex_both_axes_ix(object): +class Shift(object): + # frame shift speedup issue-5609 goal_time = 0.2 + params = [0, 1] + param_names = ['axis'] - def setup(self): - self.df = DataFrame(randn(10000, 10000)) - self.idx = np.arange(4000, 7000) + def setup(self, axis): + self.df = DataFrame(np.random.rand(10000, 500)) - def time_frame_reindex_both_axes_ix(self): - self.df.ix[(self.idx, self.idx)] + def time_shift(self, axis): + self.df.shift(1, axis=axis) -class frame_reindex_upcast(object): - goal_time = 0.2 +class Nunique(object): def setup(self): - self.df = DataFrame(dict([(c, {0: randint(0, 2, 1000).astype(np.bool_), 1: randint(0, 1000, 1000).astype(np.int16), 2: randint(0, 1000, 1000).astype(np.int32), 3: randint(0, 1000, 1000).astype(np.int64), }[randint(0, 4)]) for c in range(1000)])) + self.df = DataFrame(np.random.randn(10000, 1000)) + + def time_frame_nunique(self): + self.df.nunique() - def time_frame_reindex_upcast(self): - self.df.reindex(permutation(range(1200))) +class Duplicated(object): -class frame_repr_tall(object): goal_time = 0.2 def setup(self): - self.df = pandas.DataFrame(np.random.randn(10000, 10)) + n = (1 << 20) + t = date_range('2015-01-01', freq='S', periods=(n // 64)) + xs = np.random.randn(n // 64).round(2) + self.df = DataFrame({'a': np.random.randint(-1 << 8, 1 << 8, n), + 'b': np.random.choice(t, n), + 'c': np.random.choice(xs, n)}) + self.df2 = DataFrame(np.random.randn(1000, 100).astype(str)).T - def time_frame_repr_tall(self): - repr(self.df) - - -class frame_repr_wide(object): - goal_time = 0.2 + def time_frame_duplicated(self): + self.df.duplicated() - def setup(self): - self.df = pandas.DataFrame(np.random.randn(10, 10000)) + def time_frame_duplicated_wide(self): + self.df2.duplicated() - def time_frame_repr_wide(self): - repr(self.df) +class XS(object): -class frame_shift_axis0(object): goal_time = 0.2 + params = [0, 1] + param_names = ['axis'] - def setup(self): - self.df = DataFrame(np.random.rand(10000, 500)) + def setup(self, axis): + self.N = 10**4 + self.df = DataFrame(np.random.randn(self.N, self.N)) + + def time_frame_xs(self, axis): + self.df.xs(self.N / 2, axis=axis) - def time_frame_shift_axis0(self): - self.df.shift(1, axis=0) +class SortValues(object): -class frame_shift_axis_1(object): goal_time = 0.2 + params = [True, False] + param_names = ['ascending'] - def setup(self): - self.df = DataFrame(np.random.rand(10000, 500)) + def setup(self, ascending): + self.df = DataFrame(np.random.randn(1000000, 2), columns=list('AB')) + + def time_frame_sort_values(self, ascending): + self.df.sort_values(by='A', ascending=ascending) - def time_frame_shift_axis_1(self): - self.df.shift(1, axis=1) +class SortIndexByColumns(object): -class frame_to_html_mixed(object): goal_time = 0.2 def setup(self): - self.nrows = 500 - self.df = 
DataFrame(randn(self.nrows, 10)) - self.df[0] = period_range('2000', '2010', self.nrows) - self.df[1] = range(self.nrows) + N = 10000 + K = 10 + self.df = DataFrame({'key1': tm.makeStringIndex(N).values.repeat(K), + 'key2': tm.makeStringIndex(N).values.repeat(K), + 'value': np.random.randn(N * K)}) - def time_frame_to_html_mixed(self): - self.df.to_html() + def time_frame_sort_values_by_columns(self): + self.df.sort_values(by=['key1', 'key2']) -class frame_to_string_floats(object): +class Quantile(object): + goal_time = 0.2 + params = [0, 1] + param_names = ['axis'] - def setup(self): - self.df = DataFrame(randn(100, 10)) + def setup(self, axis): + self.df = DataFrame(np.random.randn(1000, 3), columns=list('ABC')) - def time_frame_to_string_floats(self): - self.df.to_string() + def time_frame_quantile(self, axis): + self.df.quantile([0.1, 0.5], axis=axis) -class frame_xs_col(object): +class GetDtypeCounts(object): + # 2807 goal_time = 0.2 def setup(self): - self.df = DataFrame(randn(1, 100000)) + self.df = DataFrame(np.random.randn(10, 10000)) - def time_frame_xs_col(self): - self.df.xs(50000, axis=1) + def time_frame_get_dtype_counts(self): + self.df.get_dtype_counts() + def time_info(self): + self.df.info() -class frame_xs_row(object): - goal_time = 0.2 - def setup(self): - self.df = DataFrame(randn(100000, 1)) +class NSort(object): - def time_frame_xs_row(self): - self.df.xs(50000) + goal_time = 0.2 + params = ['first', 'last', 'all'] + param_names = ['keep'] + def setup(self, keep): + self.df = DataFrame(np.random.randn(1000, 3), columns=list('ABC')) -class frame_sort_index(object): - goal_time = 0.2 + def time_nlargest(self, keep): + self.df.nlargest(100, 'A', keep=keep) - def setup(self): - self.df = DataFrame(randn(1000000, 2), columns=list('AB')) + def time_nsmallest(self, keep): + self.df.nsmallest(100, 'A', keep=keep) - def time_frame_sort_index(self): - self.df.sort_index() +class Describe(object): -class series_string_vector_slice(object): goal_time = 0.2 def setup(self): - self.s = Series((['abcdefg', np.nan] * 500000)) + self.df = DataFrame({ + 'a': np.random.randint(0, 100, int(1e6)), + 'b': np.random.randint(0, 100, int(1e6)), + 'c': np.random.randint(0, 100, int(1e6)) + }) + + def time_series_describe(self): + self.df['a'].describe() - def time_series_string_vector_slice(self): - self.s.str[:5] + def time_dataframe_describe(self): + self.df.describe() diff --git a/asv_bench/benchmarks/gil.py b/asv_bench/benchmarks/gil.py index 4b82781fc39d9..21c1ccf46e1c4 100644 --- a/asv_bench/benchmarks/gil.py +++ b/asv_bench/benchmarks/gil.py @@ -1,5 +1,17 @@ -from .pandas_vb_common import * -from pandas.core import common as com +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, Series, read_csv, factorize, date_range +from pandas.core.algorithms import take_1d +try: + from pandas import (rolling_median, rolling_mean, rolling_min, rolling_max, + rolling_var, rolling_skew, rolling_kurt, rolling_std) + have_rolling_methods = True +except ImportError: + have_rolling_methods = False +try: + from pandas._libs import algos +except ImportError: + from pandas import algos try: from pandas.util.testing import test_parallel have_real_test_parallel = True @@ -7,316 +19,257 @@ have_real_test_parallel = False def test_parallel(num_threads=1): - def wrapper(fname): return fname return wrapper +from .pandas_vb_common import BaseIO, setup # noqa -class nogil_groupby_count_2(object): - goal_time = 0.2 - - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - 
np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): - raise NotImplementedError - def time_nogil_groupby_count_2(self): - self.pg2() +class ParallelGroupbyMethods(object): - @test_parallel(num_threads=2) - def pg2(self): - self.df.groupby('key')['data'].count() - - -class nogil_groupby_last_2(object): goal_time = 0.2 + params = ([2, 4, 8], ['count', 'last', 'max', 'mean', 'min', 'prod', + 'sum', 'var']) + param_names = ['threads', 'method'] - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): + def setup(self, threads, method): + if not have_real_test_parallel: raise NotImplementedError + N = 10**6 + ngroups = 10**3 + df = DataFrame({'key': np.random.randint(0, ngroups, size=N), + 'data': np.random.randn(N)}) - def time_nogil_groupby_last_2(self): - self.pg2() - - @test_parallel(num_threads=2) - def pg2(self): - self.df.groupby('key')['data'].last() + @test_parallel(num_threads=threads) + def parallel(): + getattr(df.groupby('key')['data'], method)() + self.parallel = parallel + def loop(): + getattr(df.groupby('key')['data'], method)() + self.loop = loop -class nogil_groupby_max_2(object): - goal_time = 0.2 - - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): - raise NotImplementedError + def time_parallel(self, threads, method): + self.parallel() - def time_nogil_groupby_max_2(self): - self.pg2() + def time_loop(self, threads, method): + for i in range(threads): + self.loop() - @test_parallel(num_threads=2) - def pg2(self): - self.df.groupby('key')['data'].max() +class ParallelGroups(object): -class nogil_groupby_mean_2(object): goal_time = 0.2 + params = [2, 4, 8] + param_names = ['threads'] - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): + def setup(self, threads): + if not have_real_test_parallel: raise NotImplementedError + size = 2**22 + ngroups = 10**3 + data = Series(np.random.randint(0, ngroups, size=size)) - def time_nogil_groupby_mean_2(self): - self.pg2() - - @test_parallel(num_threads=2) - def pg2(self): - self.df.groupby('key')['data'].mean() - - -class nogil_groupby_min_2(object): - goal_time = 0.2 - - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): - raise NotImplementedError + @test_parallel(num_threads=threads) + def get_groups(): + data.groupby(data).groups + self.get_groups = get_groups - def time_nogil_groupby_min_2(self): - self.pg2() + def time_get_groups(self, threads): + self.get_groups() - @test_parallel(num_threads=2) - def pg2(self): - self.df.groupby('key')['data'].min() +class ParallelTake1D(object): -class nogil_groupby_prod_2(object): goal_time = 0.2 + params = ['int64', 'float64'] + param_names = ['dtype'] - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': 
np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): + def setup(self, dtype): + if not have_real_test_parallel: raise NotImplementedError + N = 10**6 + df = DataFrame({'col': np.arange(N, dtype=dtype)}) + indexer = np.arange(100, len(df) - 100) - def time_nogil_groupby_prod_2(self): - self.pg2() - - @test_parallel(num_threads=2) - def pg2(self): - self.df.groupby('key')['data'].prod() - - -class nogil_groupby_sum_2(object): - goal_time = 0.2 - - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): - raise NotImplementedError + @test_parallel(num_threads=2) + def parallel_take1d(): + take_1d(df['col'].values, indexer) + self.parallel_take1d = parallel_take1d - def time_nogil_groupby_sum_2(self): - self.pg2() + def time_take1d(self, dtype): + self.parallel_take1d() - @test_parallel(num_threads=2) - def pg2(self): - self.df.groupby('key')['data'].sum() +class ParallelKth(object): -class nogil_groupby_sum_4(object): - goal_time = 0.2 + number = 1 + repeat = 5 def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): + if not have_real_test_parallel: raise NotImplementedError + N = 10**7 + k = 5 * 10**5 + kwargs_list = [{'arr': np.random.randn(N)}, + {'arr': np.random.randn(N)}] - def time_nogil_groupby_sum_4(self): - self.pg4() - - def f(self): - self.df.groupby('key')['data'].sum() - - def g2(self): - for i in range(2): - self.f() + @test_parallel(num_threads=2, kwargs_list=kwargs_list) + def parallel_kth_smallest(arr): + algos.kth_smallest(arr, k) + self.parallel_kth_smallest = parallel_kth_smallest - def g4(self): - for i in range(4): - self.f() + def time_kth_smallest(self): + self.parallel_kth_smallest() - def g8(self): - for i in range(8): - self.f() - @test_parallel(num_threads=2) - def pg2(self): - self.f() +class ParallelDatetimeFields(object): - @test_parallel(num_threads=4) - def pg4(self): - self.f() - - @test_parallel(num_threads=8) - def pg8(self): - self.f() - - -class nogil_groupby_sum_8(object): goal_time = 0.2 def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): + if not have_real_test_parallel: raise NotImplementedError + N = 10**6 + self.dti = date_range('1900-01-01', periods=N, freq='T') + self.period = self.dti.to_period('D') + + def time_datetime_field_year(self): + @test_parallel(num_threads=2) + def run(dti): + dti.year + run(self.dti) + + def time_datetime_field_day(self): + @test_parallel(num_threads=2) + def run(dti): + dti.day + run(self.dti) + + def time_datetime_field_daysinmonth(self): + @test_parallel(num_threads=2) + def run(dti): + dti.days_in_month + run(self.dti) + + def time_datetime_field_normalize(self): + @test_parallel(num_threads=2) + def run(dti): + dti.normalize() + run(self.dti) + + def time_datetime_to_period(self): + @test_parallel(num_threads=2) + def run(dti): + dti.to_period('S') + run(self.dti) + + def time_period_to_datetime(self): + @test_parallel(num_threads=2) + def run(period): + period.to_timestamp() + run(self.period) + + +class 
ParallelRolling(object): - def time_nogil_groupby_sum_8(self): - self.pg8() - - def f(self): - self.df.groupby('key')['data'].sum() - - def g2(self): - for i in range(2): - self.f() - - def g4(self): - for i in range(4): - self.f() - - def g8(self): - for i in range(8): - self.f() - - @test_parallel(num_threads=2) - def pg2(self): - self.f() - - @test_parallel(num_threads=4) - def pg4(self): - self.f() - - @test_parallel(num_threads=8) - def pg8(self): - self.f() - - -class nogil_groupby_var_2(object): goal_time = 0.2 + params = ['median', 'mean', 'min', 'max', 'var', 'skew', 'kurt', 'std'] + param_names = ['method'] - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): + def setup(self, method): + if not have_real_test_parallel: + raise NotImplementedError + win = 100 + arr = np.random.rand(100000) + if hasattr(DataFrame, 'rolling'): + df = DataFrame(arr).rolling(win) + + @test_parallel(num_threads=2) + def parallel_rolling(): + getattr(df, method)() + self.parallel_rolling = parallel_rolling + elif have_rolling_methods: + rolling = {'median': rolling_median, + 'mean': rolling_mean, + 'min': rolling_min, + 'max': rolling_max, + 'var': rolling_var, + 'skew': rolling_skew, + 'kurt': rolling_kurt, + 'std': rolling_std} + + @test_parallel(num_threads=2) + def parallel_rolling(): + rolling[method](arr, win) + self.parallel_rolling = parallel_rolling + else: raise NotImplementedError - def time_nogil_groupby_var_2(self): - self.pg2() + def time_rolling(self, method): + self.parallel_rolling() - @test_parallel(num_threads=2) - def pg2(self): - self.df.groupby('key')['data'].var() +class ParallelReadCSV(BaseIO): -class nogil_take1d_float64(object): - goal_time = 0.2 + number = 1 + repeat = 5 + params = ['float', 'object', 'datetime'] + param_names = ['dtype'] - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): + def setup(self, dtype): + if not have_real_test_parallel: raise NotImplementedError - self.N = 10000000.0 - self.df = DataFrame({'int64': np.arange(self.N, dtype='int64'), 'float64': np.arange(self.N, dtype='float64'), }) - self.indexer = np.arange(100, (len(self.df) - 100)) + rows = 10000 + cols = 50 + data = {'float': DataFrame(np.random.randn(rows, cols)), + 'datetime': DataFrame(np.random.randn(rows, cols), + index=date_range('1/1/2000', + periods=rows)), + 'object': DataFrame('foo', + index=range(rows), + columns=['object{:03d}'.format(i) + for i in range(5)])} - def time_nogil_take1d_float64(self): - self.take_1d_pg2_int64() + self.fname = '__test_{}__.csv'.format(dtype) + df = data[dtype] + df.to_csv(self.fname) - @test_parallel(num_threads=2) - def take_1d_pg2_int64(self): - com.take_1d(self.df.int64.values, self.indexer) + @test_parallel(num_threads=2) + def parallel_read_csv(): + read_csv(self.fname) + self.parallel_read_csv = parallel_read_csv - @test_parallel(num_threads=2) - def take_1d_pg2_float64(self): - com.take_1d(self.df.float64.values, self.indexer) + def time_read_csv(self, dtype): + self.parallel_read_csv() -class nogil_take1d_int64(object): - goal_time = 0.2 +class ParallelFactorize(object): - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': 
np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): - raise NotImplementedError - self.N = 10000000.0 - self.df = DataFrame({'int64': np.arange(self.N, dtype='int64'), 'float64': np.arange(self.N, dtype='float64'), }) - self.indexer = np.arange(100, (len(self.df) - 100)) + number = 1 + repeat = 5 + params = [2, 4, 8] + param_names = ['threads'] - def time_nogil_take1d_int64(self): - self.take_1d_pg2_float64() + def setup(self, threads): + if not have_real_test_parallel: + raise NotImplementedError - @test_parallel(num_threads=2) - def take_1d_pg2_int64(self): - com.take_1d(self.df.int64.values, self.indexer) + strings = tm.makeStringIndex(100000) - @test_parallel(num_threads=2) - def take_1d_pg2_float64(self): - com.take_1d(self.df.float64.values, self.indexer) + @test_parallel(num_threads=threads) + def parallel(): + factorize(strings) + self.parallel = parallel + def loop(): + factorize(strings) + self.loop = loop -class nogil_kth_smallest(object): - number = 1 - repeat = 5 + def time_parallel(self, threads): + self.parallel() - def setup(self): - if (not have_real_test_parallel): - raise NotImplementedError - np.random.seed(1234) - self.N = 10000000 - self.k = 500000 - self.a = np.random.randn(self.N) - self.b = self.a.copy() - self.kwargs_list = [{'arr': self.a}, {'arr': self.b}] - - def time_nogil_kth_smallest(self): - @test_parallel(num_threads=2, kwargs_list=self.kwargs_list) - def run(arr): - algos.kth_smallest(arr, self.k) - run() + def time_loop(self, threads): + for i in range(threads): + self.loop() diff --git a/asv_bench/benchmarks/groupby.py b/asv_bench/benchmarks/groupby.py index 138977a29463e..0725bbeb6c36d 100644 --- a/asv_bench/benchmarks/groupby.py +++ b/asv_bench/benchmarks/groupby.py @@ -1,774 +1,581 @@ -from .pandas_vb_common import * -from string import ascii_letters, digits +import warnings +from string import ascii_letters from itertools import product +from functools import partial +import numpy as np +from pandas import (DataFrame, Series, MultiIndex, date_range, period_range, + TimeGrouper, Categorical, Timestamp) +import pandas.util.testing as tm -class groupby_agg_builtins(object): - goal_time = 0.2 - - def setup(self): - np.random.seed(27182) - self.n = 100000 - self.df = DataFrame(np.random.randint(1, (self.n / 100), (self.n, 3)), columns=['jim', 'joe', 'jolie']) +from .pandas_vb_common import setup # noqa - def time_groupby_agg_builtins1(self): - self.df.groupby('jim').agg([sum, min, max]) - def time_groupby_agg_builtins2(self): - self.df.groupby(['jim', 'joe']).agg([sum, min, max]) +method_blacklist = { + 'object': {'median', 'prod', 'sem', 'cumsum', 'sum', 'cummin', 'mean', + 'max', 'skew', 'cumprod', 'cummax', 'rank', 'pct_change', 'min', + 'var', 'mad', 'describe', 'std'}, + 'datetime': {'median', 'prod', 'sem', 'cumsum', 'sum', 'mean', 'skew', + 'cumprod', 'cummax', 'pct_change', 'var', 'mad', 'describe', + 'std'} +} -#---------------------------------------------------------------------- -# dict return values -class groupby_apply_dict_return(object): +class ApplyDictReturn(object): goal_time = 0.2 def setup(self): self.labels = np.arange(1000).repeat(10) - self.data = Series(randn(len(self.labels))) - self.f = (lambda x: {'first': x.values[0], 'last': x.values[(-1)], }) + self.data = Series(np.random.randn(len(self.labels))) def time_groupby_apply_dict_return(self): - self.data.groupby(self.labels).apply(self.f) + self.data.groupby(self.labels).apply(lambda x: {'first': x.values[0], 
+ 'last': x.values[-1]}) -#---------------------------------------------------------------------- -# First / last functions +class Apply(object): -class groupby_first_last(object): goal_time = 0.2 - def setup(self): - self.labels = np.arange(10000).repeat(10) - self.data = Series(randn(len(self.labels))) - self.data[::3] = np.nan - self.data[1::3] = np.nan - self.data2 = Series(randn(len(self.labels)), dtype='float32') - self.data2[::3] = np.nan - self.data2[1::3] = np.nan - self.labels = self.labels.take(np.random.permutation(len(self.labels))) - - def time_groupby_first_float32(self): - self.data2.groupby(self.labels).first() + def setup_cache(self): + N = 10**4 + labels = np.random.randint(0, 2000, size=N) + labels2 = np.random.randint(0, 3, size=N) + df = DataFrame({'key': labels, + 'key2': labels2, + 'value1': np.random.randn(N), + 'value2': ['foo', 'bar', 'baz', 'qux'] * (N // 4) + }) + return df - def time_groupby_first_float64(self): - self.data.groupby(self.labels).first() + def time_scalar_function_multi_col(self, df): + df.groupby(['key', 'key2']).apply(lambda x: 1) - def time_groupby_last_float32(self): - self.data2.groupby(self.labels).last() + def time_scalar_function_single_col(self, df): + df.groupby('key').apply(lambda x: 1) - def time_groupby_last_float64(self): - self.data.groupby(self.labels).last() + @staticmethod + def df_copy_function(g): + # ensure that the group name is available (see GH #15062) + g.name + return g.copy() - def time_groupby_nth_float32_any(self): - self.data2.groupby(self.labels).nth(0, dropna='all') + def time_copy_function_multi_col(self, df): + df.groupby(['key', 'key2']).apply(self.df_copy_function) - def time_groupby_nth_float32_none(self): - self.data2.groupby(self.labels).nth(0) + def time_copy_overhead_single_col(self, df): + df.groupby('key').apply(self.df_copy_function) - def time_groupby_nth_float64_any(self): - self.data.groupby(self.labels).nth(0, dropna='all') - def time_groupby_nth_float64_none(self): - self.data.groupby(self.labels).nth(0) +class Groups(object): -# with datetimes (GH7555) - -class groupby_first_last_datetimes(object): goal_time = 0.2 - def setup(self): - self.df = DataFrame({'a': date_range('1/1/2011', periods=100000, freq='s'), 'b': range(100000), }) + param_names = ['key'] + params = ['int64_small', 'int64_large', 'object_small', 'object_large'] - def time_groupby_first_datetimes(self): - self.df.groupby('b').first() + def setup_cache(self): + size = 10**6 + data = {'int64_small': Series(np.random.randint(0, 100, size=size)), + 'int64_large': Series(np.random.randint(0, 10000, size=size)), + 'object_small': Series( + tm.makeStringIndex(100).take( + np.random.randint(0, 100, size=size))), + 'object_large': Series( + tm.makeStringIndex(10000).take( + np.random.randint(0, 10000, size=size)))} + return data - def time_groupby_last_datetimes(self): - self.df.groupby('b').last() + def setup(self, data, key): + self.ser = data[key] - def time_groupby_nth_datetimes_any(self): - self.df.groupby('b').nth(0, dropna='all') + def time_series_groups(self, data, key): + self.ser.groupby(self.ser).groups - def time_groupby_nth_datetimes_none(self): - self.df.groupby('b').nth(0) +class GroupManyLabels(object): -class groupby_first_last_object(object): goal_time = 0.2 + params = [1, 1000] + param_names = ['ncols'] - def setup(self): - self.df = DataFrame({'a': (['foo'] * 100000), 'b': range(100000)}) - - def time_groupby_first_object(self): - self.df.groupby('b').first() + def setup(self, ncols): + N = 1000 + data = 
np.random.randn(N, ncols) + self.labels = np.random.randint(0, 100, size=N) + self.df = DataFrame(data) - def time_groupby_last_object(self): - self.df.groupby('b').last() - - def time_groupby_nth_object_any(self): - self.df.groupby('b').nth(0, dropna='any') - - def time_groupby_nth_object_none(self): - self.df.groupby('b').nth(0) + def time_sum(self, ncols): + self.df.groupby(self.labels).sum() -#---------------------------------------------------------------------- -# DataFrame Apply overhead +class Nth(object): -class groupby_frame_apply(object): goal_time = 0.2 - def setup(self): - self.N = 10000 - self.labels = np.random.randint(0, 2000, size=self.N) - self.labels2 = np.random.randint(0, 3, size=self.N) - self.df = DataFrame({'key': self.labels, 'key2': self.labels2, 'value1': randn(self.N), 'value2': (['foo', 'bar', 'baz', 'qux'] * (self.N / 4)), }) + param_names = ['dtype'] + params = ['float32', 'float64', 'datetime', 'object'] - def f(self, g): - return 1 + def setup(self, dtype): + N = 10**5 + # with datetimes (GH7555) + if dtype == 'datetime': + values = date_range('1/1/2011', periods=N, freq='s') + elif dtype == 'object': + values = ['foo'] * N + else: + values = np.arange(N).astype(dtype) - def time_groupby_frame_apply(self): - self.df.groupby(['key', 'key2']).apply(self.f) + key = np.arange(N) + self.df = DataFrame({'key': key, 'values': values}) + self.df.iloc[1, 1] = np.nan  # insert missing data - def time_groupby_frame_apply_overhead(self): - self.df.groupby('key').apply(self.f) + def time_frame_nth_any(self, dtype): + self.df.groupby('key').nth(0, dropna='any') + def time_frame_nth_all(self, dtype): + self.df.groupby('key').nth(0, dropna='all') -#---------------------------------------------------------------------- -# 2d grouping, aggregate many columns + def time_frame_nth(self, dtype): + self.df.groupby('key').nth(0) -class groupby_frame_cython_many_columns(object): - goal_time = 0.2 + def time_series_nth_any(self, dtype): + self.df['values'].groupby(self.df['key']).nth(0, dropna='any') - def setup(self): - self.labels = np.random.randint(0, 100, size=1000) - self.df = DataFrame(randn(1000, 1000)) + def time_series_nth_all(self, dtype): + self.df['values'].groupby(self.df['key']).nth(0, dropna='all') - def time_sum(self): - self.df.groupby(self.labels).sum() + def time_series_nth(self, dtype): + self.df['values'].groupby(self.df['key']).nth(0) -#---------------------------------------------------------------------- -# single key, long, integer key +class DateAttributes(object): -class groupby_frame_singlekey_integer(object): goal_time = 0.2 def setup(self): - self.data = np.random.randn(100000, 1) - self.labels = np.random.randint(0, 1000, size=100000) - self.df = DataFrame(self.data) + rng = date_range('1/1/2000', '12/31/2005', freq='H') + self.year, self.month, self.day = rng.year, rng.month, rng.day + self.ts = Series(np.random.randn(len(rng)), index=rng) - def time_sum(self): - self.df.groupby(self.labels).sum() + def time_len_groupby_object(self): + len(self.ts.groupby([self.year, self.month, self.day])) -#---------------------------------------------------------------------- -# median +class Int64(object): -class groupby_frame(object): goal_time = 0.2 def setup(self): - self.data = np.random.randn(100000, 2) - self.labels = np.random.randint(0, 1000, size=100000) - self.df = DataFrame(self.data) - - def time_groupby_frame_median(self): - self.df.groupby(self.labels).median() + arr = np.random.randint(-1 << 12, 1 << 12, (1 << 17, 5)) + i = 
np.random.choice(len(arr), len(arr) * 5) + arr = np.vstack((arr, arr[i])) + i = np.random.permutation(len(arr)) + arr = arr[i] + self.cols = list('abcde') + self.df = DataFrame(arr, columns=self.cols) + self.df['jim'], self.df['joe'] = np.random.randn(2, len(self.df)) * 10 - def time_groupby_simple_compress_timing(self): - self.df.groupby(self.labels).mean() + def time_overflow(self): + self.df.groupby(self.cols).max() -#---------------------------------------------------------------------- -# DataFrame nth +class CountMultiDtype(object): -class groupby_nth(object): goal_time = 0.2 - def setup(self): - self.df = DataFrame(np.random.randint(1, 100, (10000, 2))) - - def time_groupby_frame_nth_any(self): - self.df.groupby(0).nth(0, dropna='any') - - def time_groupby_frame_nth_none(self): - self.df.groupby(0).nth(0) - - def time_groupby_series_nth_any(self): - self.df[1].groupby(self.df[0]).nth(0, dropna='any') + def setup_cache(self): + n = 10000 + offsets = np.random.randint(n, size=n).astype('timedelta64[ns]') + dates = np.datetime64('now') + offsets + dates[np.random.rand(n) > 0.5] = np.datetime64('nat') + offsets[np.random.rand(n) > 0.5] = np.timedelta64('nat') + value2 = np.random.randn(n) + value2[np.random.rand(n) > 0.5] = np.nan + obj = np.random.choice(list('ab'), size=n).astype(object) + obj[np.random.rand(n) > 0.5] = np.nan + df = DataFrame({'key1': np.random.randint(0, 500, size=n), + 'key2': np.random.randint(0, 100, size=n), + 'dates': dates, + 'value2': value2, + 'value3': np.random.randn(n), + 'ints': np.random.randint(0, 1000, size=n), + 'obj': obj, + 'offsets': offsets}) + return df + + def time_multi_count(self, df): + df.groupby(['key1', 'key2']).count() + + +class CountMultiInt(object): - def time_groupby_series_nth_none(self): - self.df[1].groupby(self.df[0]).nth(0) - - -#---------------------------------------------------------------------- -# groupby_indices replacement, chop up Series - -class groupby_indices(object): goal_time = 0.2 - def setup(self): - try: - self.rng = date_range('1/1/2000', '12/31/2005', freq='H') - (self.year, self.month, self.day) = (self.rng.year, self.rng.month, self.rng.day) - except: - self.rng = date_range('1/1/2000', '12/31/2000', offset=datetools.Hour()) - self.year = self.rng.map((lambda x: x.year)) - self.month = self.rng.map((lambda x: x.month)) - self.day = self.rng.map((lambda x: x.day)) - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) - - def time_groupby_indices(self): - len(self.ts.groupby([self.year, self.month, self.day])) - + def setup_cache(self): + n = 10000 + df = DataFrame({'key1': np.random.randint(0, 500, size=n), + 'key2': np.random.randint(0, 100, size=n), + 'ints': np.random.randint(0, 1000, size=n), + 'ints2': np.random.randint(0, 1000, size=n)}) + return df -class groupby_int64_overflow(object): - goal_time = 0.2 + def time_multi_int_count(self, df): + df.groupby(['key1', 'key2']).count() - def setup(self): - self.arr = np.random.randint(((-1) << 12), (1 << 12), ((1 << 17), 5)) - self.i = np.random.choice(len(self.arr), (len(self.arr) * 5)) - self.arr = np.vstack((self.arr, self.arr[self.i])) - self.i = np.random.permutation(len(self.arr)) - self.arr = self.arr[self.i] - self.df = DataFrame(self.arr, columns=list('abcde')) - (self.df['jim'], self.df['joe']) = (np.random.randn(2, len(self.df)) * 10) + def time_multi_int_nunique(self, df): + df.groupby(['key1', 'key2']).nunique() - def time_groupby_int64_overflow(self): - self.df.groupby(list('abcde')).max() +class AggFunctions(object): 
-#---------------------------------------------------------------------- -# count() speed - -class groupby_multi_count(object): - goal_time = 0.2 - - def setup(self): - self.n = 10000 - self.offsets = np.random.randint(self.n, size=self.n).astype('timedelta64[ns]') - self.dates = (np.datetime64('now') + self.offsets) - self.dates[(np.random.rand(self.n) > 0.5)] = np.datetime64('nat') - self.offsets[(np.random.rand(self.n) > 0.5)] = np.timedelta64('nat') - self.value2 = np.random.randn(self.n) - self.value2[(np.random.rand(self.n) > 0.5)] = np.nan - self.obj = tm.choice(list('ab'), size=self.n).astype(object) - self.obj[(np.random.randn(self.n) > 0.5)] = np.nan - self.df = DataFrame({'key1': np.random.randint(0, 500, size=self.n), - 'key2': np.random.randint(0, 100, size=self.n), - 'dates': self.dates, - 'value2': self.value2, - 'value3': np.random.randn(self.n), - 'ints': np.random.randint(0, 1000, size=self.n), - 'obj': self.obj, - 'offsets': self.offsets, }) - - def time_groupby_multi_count(self): - self.df.groupby(['key1', 'key2']).count() - - -class groupby_int_count(object): goal_time = 0.2 - def setup(self): - self.n = 10000 - self.df = DataFrame({'key1': randint(0, 500, size=self.n), - 'key2': randint(0, 100, size=self.n), - 'ints': randint(0, 1000, size=self.n), - 'ints2': randint(0, 1000, size=self.n), }) - - def time_groupby_int_count(self): - self.df.groupby(['key1', 'key2']).count() + def setup_cache(self): + N = 10**5 + fac1 = np.array(['A', 'B', 'C'], dtype='O') + fac2 = np.array(['one', 'two'], dtype='O') + df = DataFrame({'key1': fac1.take(np.random.randint(0, 3, size=N)), + 'key2': fac2.take(np.random.randint(0, 2, size=N)), + 'value1': np.random.randn(N), + 'value2': np.random.randn(N), + 'value3': np.random.randn(N)}) + return df + def time_different_str_functions(self, df): + df.groupby(['key1', 'key2']).agg({'value1': 'mean', + 'value2': 'var', + 'value3': 'sum'}) -#---------------------------------------------------------------------- -# group with different functions per column - -class groupby_agg_multi(object): - goal_time = 0.2 + def time_different_numpy_functions(self, df): + df.groupby(['key1', 'key2']).agg({'value1': np.mean, + 'value2': np.var, + 'value3': np.sum}) - def setup(self): - self.fac1 = np.array(['A', 'B', 'C'], dtype='O') - self.fac2 = np.array(['one', 'two'], dtype='O') - self.df = DataFrame({'key1': self.fac1.take(np.random.randint(0, 3, size=100000)), 'key2': self.fac2.take(np.random.randint(0, 2, size=100000)), 'value1': np.random.randn(100000), 'value2': np.random.randn(100000), 'value3': np.random.randn(100000), }) + def time_different_python_functions_multicol(self, df): + df.groupby(['key1', 'key2']).agg([sum, min, max]) - def time_groupby_multi_different_functions(self): - self.df.groupby(['key1', 'key2']).agg({'value1': 'mean', 'value2': 'var', 'value3': 'sum'}) + def time_different_python_functions_singlecol(self, df): + df.groupby('key1').agg([sum, min, max]) - def time_groupby_multi_different_numpy_functions(self): - self.df.groupby(['key1', 'key2']).agg({'value1': np.mean, 'value2': np.var, 'value3': np.sum}) +class GroupStrings(object): -class groupby_multi_index(object): goal_time = 0.2 def setup(self): - self.n = (((5 * 7) * 11) * (1 << 9)) - self.alpha = list(map(''.join, product((ascii_letters + digits), repeat=4))) - self.f = (lambda k: np.repeat(np.random.choice(self.alpha, (self.n // k)), k)) - self.df = DataFrame({'a': self.f(11), 'b': self.f(7), 'c': self.f(5), 'd': self.f(1), }) + n = 2 * 10**5 + alpha = list(map(''.join, 
product(ascii_letters, repeat=4))) + data = np.random.choice(alpha, (n // 5, 4), replace=False) + data = np.repeat(data, 5, axis=0) + self.df = DataFrame(data, columns=list('abcd')) self.df['joe'] = (np.random.randn(len(self.df)) * 10).round(3) - self.i = np.random.permutation(len(self.df)) - self.df = self.df.iloc[self.i].reset_index(drop=True).copy() + self.df = self.df.sample(frac=1).reset_index(drop=True) - def time_groupby_multi_index(self): + def time_multi_columns(self): self.df.groupby(list('abcd')).max() -class groupby_multi(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.ngroups = 100 - self.df = DataFrame({'key1': self.get_test_data(ngroups=self.ngroups), 'key2': self.get_test_data(ngroups=self.ngroups), 'data1': np.random.randn(self.N), 'data2': np.random.randn(self.N), }) - self.simple_series = Series(np.random.randn(self.N)) - self.key1 = self.df['key1'] - - def get_test_data(self, ngroups=100, n=100000): - self.unique_groups = range(self.ngroups) - self.arr = np.asarray(np.tile(self.unique_groups, (n / self.ngroups)), dtype=object) - if (len(self.arr) < n): - self.arr = np.asarray((list(self.arr) + self.unique_groups[:(n - len(self.arr))]), dtype=object) - random.shuffle(self.arr) - return self.arr +class MultiColumn(object): - def f(self): - self.df.groupby(['key1', 'key2']).agg((lambda x: x.values.sum())) + goal_time = 0.2 - def time_groupby_multi_cython(self): - self.df.groupby(['key1', 'key2']).sum() + def setup_cache(self): + N = 10**5 + key1 = np.tile(np.arange(100, dtype=object), 1000) + key2 = key1.copy() + np.random.shuffle(key1) + np.random.shuffle(key2) + df = DataFrame({'key1': key1, + 'key2': key2, + 'data1': np.random.randn(N), + 'data2': np.random.randn(N)}) + return df - def time_groupby_multi_python(self): - self.df.groupby(['key1', 'key2'])['data1'].agg((lambda x: x.values.sum())) + def time_lambda_sum(self, df): + df.groupby(['key1', 'key2']).agg(lambda x: x.values.sum()) - def time_groupby_multi_series_op(self): - self.df.groupby(['key1', 'key2'])['data1'].agg(np.std) + def time_cython_sum(self, df): + df.groupby(['key1', 'key2']).sum() - def time_groupby_series_simple_cython(self): - self.simple_series.groupby(self.key1).sum() + def time_col_select_lambda_sum(self, df): + df.groupby(['key1', 'key2'])['data1'].agg(lambda x: x.values.sum()) - def time_groupby_series_simple_rank(self): - self.df.groupby('key1').rank(pct=True) + def time_col_select_numpy_sum(self, df): + df.groupby(['key1', 'key2'])['data1'].agg(np.sum) -#---------------------------------------------------------------------- -# size() speed +class Size(object): -class groupby_size(object): goal_time = 0.2 def setup(self): - self.n = 100000 - self.offsets = np.random.randint(self.n, size=self.n).astype('timedelta64[ns]') - self.dates = (np.datetime64('now') + self.offsets) - self.df = DataFrame({'key1': np.random.randint(0, 500, size=self.n), 'key2': np.random.randint(0, 100, size=self.n), 'value1': np.random.randn(self.n), 'value2': np.random.randn(self.n), 'value3': np.random.randn(self.n), 'dates': self.dates, }) - - def time_groupby_multi_size(self): + n = 10**5 + offsets = np.random.randint(n, size=n).astype('timedelta64[ns]') + dates = np.datetime64('now') + offsets + self.df = DataFrame({'key1': np.random.randint(0, 500, size=n), + 'key2': np.random.randint(0, 100, size=n), + 'value1': np.random.randn(n), + 'value2': np.random.randn(n), + 'value3': np.random.randn(n), + 'dates': dates}) + self.draws = Series(np.random.randn(n)) + labels = Series(['foo', 'bar', 
'baz', 'qux'] * (n // 4)) + self.cats = labels.astype('category') + + def time_multi_size(self): self.df.groupby(['key1', 'key2']).size() - def time_groupby_dt_size(self): - self.df.groupby(['dates']).size() + def time_dt_timegrouper_size(self): + with warnings.catch_warnings(record=True): + self.df.groupby(TimeGrouper(key='dates', freq='M')).size() - def time_groupby_dt_timegrouper_size(self): - self.df.groupby(TimeGrouper(key='dates', freq='M')).size() + def time_category_size(self): + self.draws.groupby(self.cats).size() -#---------------------------------------------------------------------- -# groupby with a variable value for ngroups +class GroupByMethods(object): -class groupby_ngroups_10000(object): goal_time = 0.2 - def setup(self): - np.random.seed(1234) - self.ngroups = 10000 - self.size = (self.ngroups * 2) - self.rng = np.arange(self.ngroups) - self.df = DataFrame(dict(timestamp=self.rng.take(np.random.randint(0, self.ngroups, size=self.size)), value=np.random.randint(0, self.size, size=self.size))) - - def time_all(self): - self.df.groupby('value')['timestamp'].all() - - def time_any(self): - self.df.groupby('value')['timestamp'].any() - - def time_count(self): - self.df.groupby('value')['timestamp'].count() - - def time_cumcount(self): - self.df.groupby('value')['timestamp'].cumcount() - - def time_cummax(self): - self.df.groupby('value')['timestamp'].cummax() - - def time_cummin(self): - self.df.groupby('value')['timestamp'].cummin() - - def time_cumprod(self): - self.df.groupby('value')['timestamp'].cumprod() - - def time_cumsum(self): - self.df.groupby('value')['timestamp'].cumsum() - - def time_describe(self): - self.df.groupby('value')['timestamp'].describe() - - def time_diff(self): - self.df.groupby('value')['timestamp'].diff() - - def time_first(self): - self.df.groupby('value')['timestamp'].first() - - def time_head(self): - self.df.groupby('value')['timestamp'].head() - - def time_last(self): - self.df.groupby('value')['timestamp'].last() - - def time_mad(self): - self.df.groupby('value')['timestamp'].mad() - - def time_max(self): - self.df.groupby('value')['timestamp'].max() - - def time_mean(self): - self.df.groupby('value')['timestamp'].mean() - - def time_median(self): - self.df.groupby('value')['timestamp'].median() - - def time_min(self): - self.df.groupby('value')['timestamp'].min() - - def time_nunique(self): - self.df.groupby('value')['timestamp'].nunique() - - def time_pct_change(self): - self.df.groupby('value')['timestamp'].pct_change() - - def time_prod(self): - self.df.groupby('value')['timestamp'].prod() - - def time_rank(self): - self.df.groupby('value')['timestamp'].rank() - - def time_sem(self): - self.df.groupby('value')['timestamp'].sem() - - def time_size(self): - self.df.groupby('value')['timestamp'].size() - - def time_skew(self): - self.df.groupby('value')['timestamp'].skew() - - def time_std(self): - self.df.groupby('value')['timestamp'].std() - - def time_sum(self): - self.df.groupby('value')['timestamp'].sum() - - def time_tail(self): - self.df.groupby('value')['timestamp'].tail() - - def time_unique(self): - self.df.groupby('value')['timestamp'].unique() + param_names = ['dtype', 'method', 'application'] + params = [['int', 'float', 'object', 'datetime'], + ['all', 'any', 'bfill', 'count', 'cumcount', 'cummax', 'cummin', + 'cumprod', 'cumsum', 'describe', 'ffill', 'first', 'head', + 'last', 'mad', 'max', 'min', 'median', 'mean', 'nunique', + 'pct_change', 'prod', 'rank', 'sem', 'shift', 'size', 'skew', + 'std', 'sum', 'tail', 'unique', 
'value_counts', 'var'], + ['direct', 'transformation']] + + def setup(self, dtype, method, application): + if method in method_blacklist.get(dtype, {}): + raise NotImplementedError  # skip benchmark + ngroups = 1000 + size = ngroups * 2 + rng = np.arange(ngroups) + values = rng.take(np.random.randint(0, ngroups, size=size)) + if dtype == 'int': + key = np.random.randint(0, size, size=size) + elif dtype == 'float': + key = np.concatenate([np.random.random(ngroups) * 0.1, + np.random.random(ngroups) * 10.0]) + elif dtype == 'object': + key = ['foo'] * size + elif dtype == 'datetime': + key = date_range('1/1/2011', periods=size, freq='s') + + df = DataFrame({'values': values, 'key': key}) + + if application == 'transformation': + if method == 'describe': + raise NotImplementedError + + self.as_group_method = lambda: df.groupby( + 'key')['values'].transform(method) + self.as_field_method = lambda: df.groupby( + 'values')['key'].transform(method) + else: + self.as_group_method = getattr(df.groupby('key')['values'], method) + self.as_field_method = getattr(df.groupby('values')['key'], method) + + def time_dtype_as_group(self, dtype, method, application): + self.as_group_method() + + def time_dtype_as_field(self, dtype, method, application): + self.as_field_method() + + +class RankWithTies(object): + # GH 21237 + goal_time = 0.2 + param_names = ['dtype', 'tie_method'] + params = [['float64', 'float32', 'int64', 'datetime64'], + ['first', 'average', 'dense', 'min', 'max']] - def time_value_counts(self): - self.df.groupby('value')['timestamp'].value_counts() + def setup(self, dtype, tie_method): + N = 10**4 + if dtype == 'datetime64': + data = np.array([Timestamp("2011/01/01")] * N, dtype=dtype) + else: + data = np.array([1] * N, dtype=dtype) + self.df = DataFrame({'values': data, 'key': ['foo'] * N}) - def time_var(self): - self.df.groupby('value')['timestamp'].var() + def time_rank_ties(self, dtype, tie_method): + self.df.groupby('key').rank(method=tie_method) -class groupby_ngroups_100(object): +class Float32(object): + # GH 13335 goal_time = 0.2 def setup(self): - np.random.seed(1234) - self.ngroups = 100 - self.size = (self.ngroups * 2) - self.rng = np.arange(self.ngroups) - self.df = DataFrame(dict(timestamp=self.rng.take(np.random.randint(0, self.ngroups, size=self.size)), value=np.random.randint(0, self.size, size=self.size))) - - def time_all(self): - self.df.groupby('value')['timestamp'].all() - - def time_any(self): - self.df.groupby('value')['timestamp'].any() - - def time_count(self): - self.df.groupby('value')['timestamp'].count() - - def time_cumcount(self): - self.df.groupby('value')['timestamp'].cumcount() - - def time_cummax(self): - self.df.groupby('value')['timestamp'].cummax() - - def time_cummin(self): - self.df.groupby('value')['timestamp'].cummin() - - def time_cumprod(self): - self.df.groupby('value')['timestamp'].cumprod() - - def time_cumsum(self): - self.df.groupby('value')['timestamp'].cumsum() - - def time_describe(self): - self.df.groupby('value')['timestamp'].describe() - - def time_diff(self): - self.df.groupby('value')['timestamp'].diff() - - def time_first(self): - self.df.groupby('value')['timestamp'].first() - - def time_head(self): - self.df.groupby('value')['timestamp'].head() - - def time_last(self): - self.df.groupby('value')['timestamp'].last() - - def time_mad(self): - self.df.groupby('value')['timestamp'].mad() - - def time_max(self): - self.df.groupby('value')['timestamp'].max() - - def time_mean(self): - self.df.groupby('value')['timestamp'].mean() - - def 
time_median(self): - self.df.groupby('value')['timestamp'].median() - - def time_min(self): - self.df.groupby('value')['timestamp'].min() - - def time_nunique(self): - self.df.groupby('value')['timestamp'].nunique() - - def time_pct_change(self): - self.df.groupby('value')['timestamp'].pct_change() - - def time_prod(self): - self.df.groupby('value')['timestamp'].prod() - - def time_rank(self): - self.df.groupby('value')['timestamp'].rank() - - def time_sem(self): - self.df.groupby('value')['timestamp'].sem() - - def time_size(self): - self.df.groupby('value')['timestamp'].size() - - def time_skew(self): - self.df.groupby('value')['timestamp'].skew() - - def time_std(self): - self.df.groupby('value')['timestamp'].std() + tmp1 = (np.random.random(10000) * 0.1).astype(np.float32) + tmp2 = (np.random.random(10000) * 10.0).astype(np.float32) + tmp = np.concatenate((tmp1, tmp2)) + arr = np.repeat(tmp, 10) + self.df = DataFrame(dict(a=arr, b=arr)) def time_sum(self): - self.df.groupby('value')['timestamp'].sum() - - def time_tail(self): - self.df.groupby('value')['timestamp'].tail() - - def time_unique(self): - self.df.groupby('value')['timestamp'].unique() + self.df.groupby(['a'])['b'].sum() - def time_value_counts(self): - self.df.groupby('value')['timestamp'].value_counts() - def time_var(self): - self.df.groupby('value')['timestamp'].var() +class Categories(object): - -#---------------------------------------------------------------------- -# Series.value_counts - -class series_value_counts(object): goal_time = 0.2 def setup(self): - self.s = Series(np.random.randint(0, 1000, size=100000)) - self.s2 = self.s.astype(float) + N = 10**5 + arr = np.random.random(N) + data = {'a': Categorical(np.random.randint(10000, size=N)), + 'b': arr} + self.df = DataFrame(data) + data = {'a': Categorical(np.random.randint(10000, size=N), + ordered=True), + 'b': arr} + self.df_ordered = DataFrame(data) + data = {'a': Categorical(np.random.randint(100, size=N), + categories=np.arange(10000)), + 'b': arr} + self.df_extra_cat = DataFrame(data) - self.K = 1000 - self.N = 100000 - self.uniques = tm.makeStringIndex(self.K).values - self.s3 = Series(np.tile(self.uniques, (self.N // self.K))) + def time_groupby_sort(self): + self.df.groupby('a')['b'].count() - def time_value_counts_int64(self): - self.s.value_counts() + def time_groupby_nosort(self): + self.df.groupby('a', sort=False)['b'].count() - def time_value_counts_float64(self): - self.s2.value_counts() + def time_groupby_ordered_sort(self): + self.df_ordered.groupby('a')['b'].count() - def time_value_counts_strings(self): - self.s.value_counts() + def time_groupby_ordered_nosort(self): + self.df_ordered.groupby('a', sort=False)['b'].count() + def time_groupby_extra_cat_sort(self): + self.df_extra_cat.groupby('a')['b'].count() -#---------------------------------------------------------------------- -# pivot_table + def time_groupby_extra_cat_nosort(self): + self.df_extra_cat.groupby('a', sort=False)['b'].count() -class groupby_pivot_table(object): - goal_time = 0.2 - def setup(self): - self.fac1 = np.array(['A', 'B', 'C'], dtype='O') - self.fac2 = np.array(['one', 'two'], dtype='O') - self.ind1 = np.random.randint(0, 3, size=100000) - self.ind2 = np.random.randint(0, 2, size=100000) - self.df = DataFrame({'key1': self.fac1.take(self.ind1), 'key2': self.fac2.take(self.ind2), 'key3': self.fac2.take(self.ind2), 'value1': np.random.randn(100000), 'value2': np.random.randn(100000), 'value3': np.random.randn(100000), }) +class Datelike(object): + # GH 14338 + 
goal_time = 0.2 + params = ['period_range', 'date_range', 'date_range_tz'] + param_names = ['grouper'] - def time_groupby_pivot_table(self): - self.df.pivot_table(index='key1', columns=['key2', 'key3']) + def setup(self, grouper): + N = 10**4 + rng_map = {'period_range': period_range, + 'date_range': date_range, + 'date_range_tz': partial(date_range, tz='US/Central')} + self.grouper = rng_map[grouper]('1900-01-01', freq='D', periods=N) + self.df = DataFrame(np.random.randn(10**4, 2)) + def time_sum(self, grouper): + self.df.groupby(self.grouper).sum() -#---------------------------------------------------------------------- -# Sum booleans #2692 -class groupby_sum_booleans(object): +class SumBools(object): + # GH 2692 goal_time = 0.2 def setup(self): - self.N = 500 - self.df = DataFrame({'ii': range(self.N), 'bb': [True for x in range(self.N)], }) + N = 500 + self.df = DataFrame({'ii': range(N), + 'bb': [True] * N}) def time_groupby_sum_booleans(self): self.df.groupby('ii').sum() -#---------------------------------------------------------------------- -# multi-indexed group sum #9049 - -class groupby_sum_multiindex(object): +class SumMultiLevel(object): + # GH 9049 goal_time = 0.2 + timeout = 120.0 def setup(self): - self.N = 50 - self.df = DataFrame({'A': (range(self.N) * 2), 'B': range((self.N * 2)), 'C': 1, }).set_index(['A', 'B']) + N = 50 + self.df = DataFrame({'A': list(range(N)) * 2, + 'B': range(N * 2), + 'C': 1}).set_index(['A', 'B']) def time_groupby_sum_multiindex(self): self.df.groupby(level=[0, 1]).sum() -#------------------------------------------------------------------------------- -# Transform testing - -class groupby_transform(object): - goal_time = 0.2 - - def setup(self): - self.n_dates = 400 - self.n_securities = 250 - self.n_columns = 3 - self.share_na = 0.1 - self.dates = date_range('1997-12-31', periods=self.n_dates, freq='B') - self.dates = Index(map((lambda x: (((x.year * 10000) + (x.month * 100)) + x.day)), self.dates)) - self.secid_min = int('10000000', 16) - self.secid_max = int('F0000000', 16) - self.step = ((self.secid_max - self.secid_min) // (self.n_securities - 1)) - self.security_ids = map((lambda x: hex(x)[2:10].upper()), range(self.secid_min, (self.secid_max + 1), self.step)) - self.data_index = MultiIndex(levels=[self.dates.values, self.security_ids], - labels=[[i for i in range(self.n_dates) for _ in range(self.n_securities)], (range(self.n_securities) * self.n_dates)], - names=['date', 'security_id']) - self.n_data = len(self.data_index) - self.columns = Index(['factor{}'.format(i) for i in range(1, (self.n_columns + 1))]) - self.data = DataFrame(np.random.randn(self.n_data, self.n_columns), index=self.data_index, columns=self.columns) - self.step = int((self.n_data * self.share_na)) - for column_index in range(self.n_columns): - self.index = column_index - while (self.index < self.n_data): - self.data.set_value(self.data_index[self.index], self.columns[column_index], np.nan) - self.index += self.step - self.f_fillna = (lambda x: x.fillna(method='pad')) - - def time_groupby_transform(self): - self.data.groupby(level='security_id').transform(self.f_fillna) - - def time_groupby_transform_ufunc(self): - self.data.groupby(level='date').transform(np.max) - - -class groupby_transform_multi_key(object): - goal_time = 0.2 - - def setup(self): - np.random.seed(2718281) - self.n = 20000 - self.df = DataFrame(np.random.randint(1, self.n, (self.n, 3)), columns=['jim', 'joe', 'jolie']) - - def time_groupby_transform_multi_key1(self): - self.df.groupby(['jim', 
'joe'])['jolie'].transform('max') - +class Transform(object): -class groupby_transform_multi_key2(object): goal_time = 0.2 def setup(self): - np.random.seed(2718281) - self.n = 20000 - self.df = DataFrame(np.random.randint(1, self.n, (self.n, 3)), columns=['jim', 'joe', 'jolie']) - self.df['jim'] = self.df['joe'] + n1 = 400 + n2 = 250 + index = MultiIndex(levels=[np.arange(n1), tm.makeStringIndex(n2)], + labels=[np.repeat(range(n1), n2).tolist(), + list(range(n2)) * n1], + names=['lev1', 'lev2']) + arr = np.random.randn(n1 * n2, 3) + arr[::10000, 0] = np.nan + arr[1::10000, 1] = np.nan + arr[2::10000, 2] = np.nan + data = DataFrame(arr, index=index, columns=['col1', 'col2', 'col3']) + self.df = data - def time_groupby_transform_multi_key2(self): - self.df.groupby(['jim', 'joe'])['jolie'].transform('max') + n = 20000 + self.df1 = DataFrame(np.random.randint(1, n, (n, 3)), + columns=['jim', 'joe', 'jolie']) + self.df2 = self.df1.copy() + self.df2['jim'] = self.df2['joe'] + self.df3 = DataFrame(np.random.randint(1, (n // 10), (n, 3)), + columns=['jim', 'joe', 'jolie']) + self.df4 = self.df3.copy() + self.df4['jim'] = self.df4['joe'] -class groupby_transform_multi_key3(object): - goal_time = 0.2 + def time_transform_lambda_max(self): + self.df.groupby(level='lev1').transform(lambda x: max(x)) - def setup(self): - np.random.seed(2718281) - self.n = 200000 - self.df = DataFrame(np.random.randint(1, (self.n / 10), (self.n, 3)), columns=['jim', 'joe', 'jolie']) + def time_transform_ufunc_max(self): + self.df.groupby(level='lev1').transform(np.max) - def time_groupby_transform_multi_key3(self): - self.df.groupby(['jim', 'joe'])['jolie'].transform('max') + def time_transform_multi_key1(self): + self.df1.groupby(['jim', 'joe'])['jolie'].transform('max') + def time_transform_multi_key2(self): + self.df2.groupby(['jim', 'joe'])['jolie'].transform('max') -class groupby_transform_multi_key4(object): - goal_time = 0.2 + def time_transform_multi_key3(self): + self.df3.groupby(['jim', 'joe'])['jolie'].transform('max') - def setup(self): - np.random.seed(2718281) - self.n = 200000 - self.df = DataFrame(np.random.randint(1, (self.n / 10), (self.n, 3)), columns=['jim', 'joe', 'jolie']) - self.df['jim'] = self.df['joe'] + def time_transform_multi_key4(self): + self.df4.groupby(['jim', 'joe'])['jolie'].transform('max') +class TransformBools(object): -class groupby_transform_series(object): goal_time = 0.2 def setup(self): - np.random.seed(0) - self.N = 120000 - self.N_TRANSITIONS = 1400 - self.transition_points = np.random.permutation(np.arange(self.N))[:self.N_TRANSITIONS] - self.transition_points.sort() - self.transitions = np.zeros((self.N,), dtype=np.bool) - self.transitions[self.transition_points] = True - self.g = self.transitions.cumsum() - self.df = DataFrame({'signal': np.random.rand(self.N), }) - - def time_groupby_transform_series(self): + N = 120000 + transition_points = np.sort(np.random.choice(np.arange(N), 1400)) + transitions = np.zeros(N, dtype=np.bool) + transitions[transition_points] = True + self.g = transitions.cumsum() + self.df = DataFrame({'signal': np.random.rand(N)}) + + def time_transform_mean(self): self.df['signal'].groupby(self.g).transform(np.mean) -class groupby_transform_series2(object): +class TransformNaN(object): + # GH 12737 goal_time = 0.2 def setup(self): - np.random.seed(0) - self.df = DataFrame({'id': (np.arange(100000) / 3), 'val': np.random.randn(100000), }) + 
self.df_nans = DataFrame({'key': np.repeat(np.arange(1000), 10), + 'B': np.nan, + 'C': np.nan}) + self.df_nans.loc[4::10, 'B':'C'] = 5 - def time_groupby_transform_series2(self): - self.df.groupby('id')['val'].transform(np.mean) + def time_first(self): + self.df_nans.groupby('key').transform('first') diff --git a/asv_bench/benchmarks/hdfstore_bench.py b/asv_bench/benchmarks/hdfstore_bench.py deleted file mode 100644 index 7638cc2a0f8df..0000000000000 --- a/asv_bench/benchmarks/hdfstore_bench.py +++ /dev/null @@ -1,351 +0,0 @@ -from .pandas_vb_common import * -import os - - -class query_store_table(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.index = date_range('1/1/2000', periods=25000) - self.df = DataFrame({'float1': randn(25000), 'float2': randn(25000), }, index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - self.store.append('df12', self.df) - - def time_query_store_table(self): - self.store.select('df12', [('index', '>', self.df.index[10000]), ('index', '<', self.df.index[15000])]) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class query_store_table_wide(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.index = date_range('1/1/2000', periods=25000) - self.df = DataFrame(np.random.randn(25000, 100), index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - self.store.append('df11', self.df) - - def time_query_store_table_wide(self): - self.store.select('df11', [('index', '>', self.df.index[10000]), ('index', '<', self.df.index[15000])]) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class read_store(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.index = tm.makeStringIndex(25000) - self.df = DataFrame({'float1': randn(25000), 'float2': randn(25000), }, index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - self.store.put('df1', self.df) - - def time_read_store(self): - self.store.get('df1') - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class read_store_mixed(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.index = tm.makeStringIndex(25000) - self.df = DataFrame({'float1': randn(25000), 'float2': randn(25000), 'string1': (['foo'] * 25000), 'bool1': ([True] * 25000), 'int1': np.random.randint(0, 250000, size=25000), }, index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - self.store.put('df3', self.df) - - def time_read_store_mixed(self): - self.store.get('df3') - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class read_store_table(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.index = tm.makeStringIndex(25000) - self.df = DataFrame({'float1': randn(25000), 'float2': randn(25000), }, index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - self.store.append('df7', self.df) - - def time_read_store_table(self): - self.store.select('df7') - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class read_store_table_mixed(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.N = 10000 - self.index = tm.makeStringIndex(self.N) - self.df = DataFrame({'float1': 
randn(self.N), 'float2': randn(self.N), 'string1': (['foo'] * self.N), 'bool1': ([True] * self.N), 'int1': np.random.randint(0, self.N, size=self.N), }, index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - self.store.append('df5', self.df) - - def time_read_store_table_mixed(self): - self.store.select('df5') - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class read_store_table_panel(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.p = Panel(randn(20, 1000, 25), items=[('Item%03d' % i) for i in range(20)], major_axis=date_range('1/1/2000', periods=1000), minor_axis=[('E%03d' % i) for i in range(25)]) - self.remove(self.f) - self.store = HDFStore(self.f) - self.store.append('p1', self.p) - - def time_read_store_table_panel(self): - self.store.select('p1') - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class read_store_table_wide(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.df = DataFrame(np.random.randn(25000, 100)) - self.remove(self.f) - self.store = HDFStore(self.f) - self.store.append('df9', self.df) - - def time_read_store_table_wide(self): - self.store.select('df9') - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class write_store(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.index = tm.makeStringIndex(25000) - self.df = DataFrame({'float1': randn(25000), 'float2': randn(25000), }, index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - - def time_write_store(self): - self.store.put('df2', self.df) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class write_store_mixed(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.index = tm.makeStringIndex(25000) - self.df = DataFrame({'float1': randn(25000), 'float2': randn(25000), 'string1': (['foo'] * 25000), 'bool1': ([True] * 25000), 'int1': np.random.randint(0, 250000, size=25000), }, index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - - def time_write_store_mixed(self): - self.store.put('df4', self.df) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class write_store_table(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.index = tm.makeStringIndex(25000) - self.df = DataFrame({'float1': randn(25000), 'float2': randn(25000), }, index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - - def time_write_store_table(self): - self.store.append('df8', self.df) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class write_store_table_dc(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.df = DataFrame(np.random.randn(10000, 10), columns=[('C%03d' % i) for i in range(10)]) - self.remove(self.f) - self.store = HDFStore(self.f) - - def time_write_store_table_dc(self): - self.store.append('df15', self.df, data_columns=True) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class write_store_table_mixed(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.index = 
tm.makeStringIndex(25000) - self.df = DataFrame({'float1': randn(25000), 'float2': randn(25000), 'string1': (['foo'] * 25000), 'bool1': ([True] * 25000), 'int1': np.random.randint(0, 25000, size=25000), }, index=self.index) - self.remove(self.f) - self.store = HDFStore(self.f) - - def time_write_store_table_mixed(self): - self.store.append('df6', self.df) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class write_store_table_panel(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.p = Panel(randn(20, 1000, 25), items=[('Item%03d' % i) for i in range(20)], major_axis=date_range('1/1/2000', periods=1000), minor_axis=[('E%03d' % i) for i in range(25)]) - self.remove(self.f) - self.store = HDFStore(self.f) - - def time_write_store_table_panel(self): - self.store.append('p2', self.p) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class write_store_table_wide(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.df = DataFrame(np.random.randn(25000, 100)) - self.remove(self.f) - self.store = HDFStore(self.f) - - def time_write_store_table_wide(self): - self.store.append('df10', self.df) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass \ No newline at end of file diff --git a/asv_bench/benchmarks/index_object.py b/asv_bench/benchmarks/index_object.py index 8c65f09937df4..f1703e163917a 100644 --- a/asv_bench/benchmarks/index_object.py +++ b/asv_bench/benchmarks/index_object.py @@ -1,292 +1,194 @@ -from .pandas_vb_common import * +import numpy as np +import pandas.util.testing as tm +from pandas import (Series, date_range, DatetimeIndex, Index, RangeIndex, + Float64Index) +from .pandas_vb_common import setup # noqa -class datetime_index_intersection(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=10000, freq='T') - self.rng2 = self.rng[:(-1)] - - def time_datetime_index_intersection(self): - self.rng.intersection(self.rng2) - - -class datetime_index_repr(object): - goal_time = 0.2 - - def setup(self): - self.dr = pd.date_range('20000101', freq='D', periods=100000) - - def time_datetime_index_repr(self): - self.dr._is_dates_only - - -class datetime_index_union(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=10000, freq='T') - self.rng2 = self.rng[:(-1)] - - def time_datetime_index_union(self): - self.rng.union(self.rng2) +class SetOperations(object): -class index_datetime_intersection(object): goal_time = 0.2 + params = (['datetime', 'date_string', 'int', 'strings'], + ['intersection', 'union', 'symmetric_difference']) + param_names = ['dtype', 'method'] - def setup(self): - self.rng = DatetimeIndex(start='1/1/2000', periods=10000, freq=datetools.Minute()) - if (self.rng.dtype == object): - self.rng = self.rng.view(Index) - else: - self.rng = self.rng.asobject - self.rng2 = self.rng[:(-1)] - - def time_index_datetime_intersection(self): - self.rng.intersection(self.rng2) - + def setup(self, dtype, method): + N = 10**5 + dates_left = date_range('1/1/2000', periods=N, freq='T') + fmt = '%Y-%m-%d %H:%M:%S' + date_str_left = Index(dates_left.strftime(fmt)) + int_left = Index(np.arange(N)) + str_left = tm.makeStringIndex(N) + data = {'datetime': {'left': dates_left, 'right': dates_left[:-1]}, + 'date_string': {'left': date_str_left, + 'right': 
date_str_left[:-1]}, + 'int': {'left': int_left, 'right': int_left[:-1]}, + 'strings': {'left': str_left, 'right': str_left[:-1]}} + self.left = data[dtype]['left'] + self.right = data[dtype]['right'] -class index_datetime_union(object): - goal_time = 0.2 - - def setup(self): - self.rng = DatetimeIndex(start='1/1/2000', periods=10000, freq=datetools.Minute()) - if (self.rng.dtype == object): - self.rng = self.rng.view(Index) - else: - self.rng = self.rng.asobject - self.rng2 = self.rng[:(-1)] + def time_operation(self, dtype, method): + getattr(self.left, method)(self.right) - def time_index_datetime_union(self): - self.rng.union(self.rng2) +class SetDisjoint(object): -class index_float64_boolean_indexer(object): goal_time = 0.2 def setup(self): - self.idx = tm.makeFloatIndex(1000000) - self.mask = ((np.arange(self.idx.size) % 3) == 0) - self.series_mask = Series(self.mask) - - def time_index_float64_boolean_indexer(self): - self.idx[self.mask] - + N = 10**5 + B = N + 20000 + self.datetime_left = DatetimeIndex(range(N)) + self.datetime_right = DatetimeIndex(range(N, B)) -class index_float64_boolean_series_indexer(object): - goal_time = 0.2 + def time_datetime_difference_disjoint(self): + self.datetime_left.difference(self.datetime_right) - def setup(self): - self.idx = tm.makeFloatIndex(1000000) - self.mask = ((np.arange(self.idx.size) % 3) == 0) - self.series_mask = Series(self.mask) - def time_index_float64_boolean_series_indexer(self): - self.idx[self.series_mask] +class Datetime(object): - -class index_float64_construct(object): goal_time = 0.2 def setup(self): - self.baseidx = np.arange(1000000.0) - - def time_index_float64_construct(self): - Index(self.baseidx) + self.dr = date_range('20000101', freq='D', periods=10000) + def time_is_dates_only(self): + self.dr._is_dates_only -class index_float64_div(object): - goal_time = 0.2 - def setup(self): - self.idx = tm.makeFloatIndex(1000000) - self.mask = ((np.arange(self.idx.size) % 3) == 0) - self.series_mask = Series(self.mask) +class Ops(object): - def time_index_float64_div(self): - (self.idx / 2) + sample_time = 0.2 + params = ['float', 'int'] + param_names = ['dtype'] + def setup(self, dtype): + N = 10**6 + indexes = {'int': 'makeIntIndex', 'float': 'makeFloatIndex'} + self.index = getattr(tm, indexes[dtype])(N) -class index_float64_get(object): - goal_time = 0.2 - - def setup(self): - self.idx = tm.makeFloatIndex(1000000) - self.mask = ((np.arange(self.idx.size) % 3) == 0) - self.series_mask = Series(self.mask) + def time_add(self, dtype): + self.index + 2 - def time_index_float64_get(self): - self.idx[1] + def time_subtract(self, dtype): + self.index - 2 + def time_multiply(self, dtype): + self.index * 2 -class index_float64_mul(object): - goal_time = 0.2 + def time_divide(self, dtype): + self.index / 2 - def setup(self): - self.idx = tm.makeFloatIndex(1000000) - self.mask = ((np.arange(self.idx.size) % 3) == 0) - self.series_mask = Series(self.mask) + def time_modulo(self, dtype): + self.index % 2 - def time_index_float64_mul(self): - (self.idx * 2) +class Range(object): -class index_float64_slice_indexer_basic(object): goal_time = 0.2 def setup(self): - self.idx = tm.makeFloatIndex(1000000) - self.mask = ((np.arange(self.idx.size) % 3) == 0) - self.series_mask = Series(self.mask) + self.idx_inc = RangeIndex(start=0, stop=10**7, step=3) + self.idx_dec = RangeIndex(start=10**7, stop=-1, step=-3) - def time_index_float64_slice_indexer_basic(self): - self.idx[:(-1)] + def time_max(self): + self.idx_inc.max() + def 
time_max_trivial(self): + self.idx_dec.max() -class index_float64_slice_indexer_even(object): - goal_time = 0.2 + def time_min(self): + self.idx_dec.min() - def setup(self): - self.idx = tm.makeFloatIndex(1000000) - self.mask = ((np.arange(self.idx.size) % 3) == 0) - self.series_mask = Series(self.mask) + def time_min_trivial(self): + self.idx_inc.min() - def time_index_float64_slice_indexer_even(self): - self.idx[::2] +class IndexAppend(object): -class index_int64_intersection(object): goal_time = 0.2 def setup(self): - self.N = 1000000 - self.options = np.arange(self.N) - self.left = Index(self.options.take(np.random.permutation(self.N)[:(self.N // 2)])) - self.right = Index(self.options.take(np.random.permutation(self.N)[:(self.N // 2)])) - def time_index_int64_intersection(self): - self.left.intersection(self.right) + N = 10000 + self.range_idx = RangeIndex(0, 100) + self.int_idx = self.range_idx.astype(int) + self.obj_idx = self.int_idx.astype(str) + self.range_idxs = [] + self.int_idxs = [] + self.object_idxs = [] + for i in range(1, N): + r_idx = RangeIndex(i * 100, (i + 1) * 100) + self.range_idxs.append(r_idx) + i_idx = r_idx.astype(int) + self.int_idxs.append(i_idx) + o_idx = i_idx.astype(str) + self.object_idxs.append(o_idx) + def time_append_range_list(self): + self.range_idx.append(self.range_idxs) -class index_int64_union(object): - goal_time = 0.2 + def time_append_int_list(self): + self.int_idx.append(self.int_idxs) - def setup(self): - self.N = 1000000 - self.options = np.arange(self.N) - self.left = Index(self.options.take(np.random.permutation(self.N)[:(self.N // 2)])) - self.right = Index(self.options.take(np.random.permutation(self.N)[:(self.N // 2)])) + def time_append_obj_list(self): + self.obj_idx.append(self.object_idxs) - def time_index_int64_union(self): - self.left.union(self.right) +class Indexing(object): -class index_str_boolean_indexer(object): goal_time = 0.2 + params = ['String', 'Float', 'Int'] + param_names = ['dtype'] - def setup(self): - self.idx = tm.makeStringIndex(1000000) - self.mask = ((np.arange(1000000) % 3) == 0) - self.series_mask = Series(self.mask) - - def time_index_str_boolean_indexer(self): - self.idx[self.mask] - + def setup(self, dtype): + N = 10**6 + self.idx = getattr(tm, 'make{}Index'.format(dtype))(N) + self.array_mask = (np.arange(N) % 3) == 0 + self.series_mask = Series(self.array_mask) + self.sorted = self.idx.sort_values() + half = N // 2 + self.non_unique = self.idx[:half].append(self.idx[:half]) + self.non_unique_sorted = self.sorted[:half].append(self.sorted[:half]) + self.key = self.sorted[N // 4] -class index_str_boolean_series_indexer(object): - goal_time = 0.2 - - def setup(self): - self.idx = tm.makeStringIndex(1000000) - self.mask = ((np.arange(1000000) % 3) == 0) - self.series_mask = Series(self.mask) + def time_boolean_array(self, dtype): + self.idx[self.array_mask] - def time_index_str_boolean_series_indexer(self): + def time_boolean_series(self, dtype): self.idx[self.series_mask] + def time_get(self, dtype): + self.idx[1] -class index_str_slice_indexer_basic(object): - goal_time = 0.2 - - def setup(self): - self.idx = tm.makeStringIndex(1000000) - self.mask = ((np.arange(1000000) % 3) == 0) - self.series_mask = Series(self.mask) - - def time_index_str_slice_indexer_basic(self): - self.idx[:(-1)] - - -class index_str_slice_indexer_even(object): - goal_time = 0.2 - - def setup(self): - self.idx = tm.makeStringIndex(1000000) - self.mask = ((np.arange(1000000) % 3) == 0) - self.series_mask = Series(self.mask) + def 
time_slice(self, dtype): + self.idx[:-1] - def time_index_str_slice_indexer_even(self): + def time_slice_step(self, dtype): self.idx[::2] + def time_get_loc(self, dtype): + self.idx.get_loc(self.key) -class multiindex_duplicated(object): - goal_time = 0.2 - - def setup(self): - (n, k) = (200, 5000) - self.levels = [np.arange(n), tm.makeStringIndex(n).values, (1000 + np.arange(n))] - self.labels = [np.random.choice(n, (k * n)) for lev in self.levels] - self.mi = MultiIndex(levels=self.levels, labels=self.labels) - - def time_multiindex_duplicated(self): - self.mi.duplicated() - - -class multiindex_from_product(object): - goal_time = 0.2 - - def setup(self): - self.iterables = [tm.makeStringIndex(10000), range(20)] - - def time_multiindex_from_product(self): - MultiIndex.from_product(self.iterables) + def time_get_loc_sorted(self, dtype): + self.sorted.get_loc(self.key) + def time_get_loc_non_unique(self, dtype): + self.non_unique.get_loc(self.key) -class multiindex_sortlevel_int64(object): - goal_time = 0.2 - - def setup(self): - self.n = ((((3 * 5) * 7) * 11) * (1 << 10)) - (low, high) = (((-1) << 12), (1 << 12)) - self.f = (lambda k: np.repeat(np.random.randint(low, high, (self.n // k)), k)) - self.i = np.random.permutation(self.n) - self.mi = MultiIndex.from_arrays([self.f(11), self.f(7), self.f(5), self.f(3), self.f(1)])[self.i] - - def time_multiindex_sortlevel_int64(self): - self.mi.sortlevel() - - -class multiindex_with_datetime_level_full(object): - goal_time = 0.2 - - def setup(self): - self.level1 = range(1000) - self.level2 = date_range(start='1/1/2012', periods=100) - self.mi = MultiIndex.from_product([self.level1, self.level2]) - - def time_multiindex_with_datetime_level_full(self): - self.mi.copy().values + def time_get_loc_non_unique_sorted(self, dtype): + self.non_unique_sorted.get_loc(self.key) -class multiindex_with_datetime_level_sliced(object): +class Float64IndexMethod(object): + # GH 13166 goal_time = 0.2 def setup(self): - self.level1 = range(1000) - self.level2 = date_range(start='1/1/2012', periods=100) - self.mi = MultiIndex.from_product([self.level1, self.level2]) + N = 100000 + a = np.arange(N) + self.ind = Float64Index(a * 4.8000000418824129e-08) - def time_multiindex_with_datetime_level_sliced(self): - self.mi[:10].values \ No newline at end of file + def time_get_loc(self): + self.ind.get_loc(0) diff --git a/asv_bench/benchmarks/indexing.py b/asv_bench/benchmarks/indexing.py index 32d80a7913234..739ad6a3d278b 100644 --- a/asv_bench/benchmarks/indexing.py +++ b/asv_bench/benchmarks/indexing.py @@ -1,489 +1,354 @@ -from .pandas_vb_common import * -try: - import pandas.computation.expressions as expr -except: - expr = None +import warnings +import numpy as np +import pandas.util.testing as tm +from pandas import (Series, DataFrame, MultiIndex, Int64Index, Float64Index, + IntervalIndex, CategoricalIndex, + IndexSlice, concat, date_range) +from .pandas_vb_common import setup, Panel # noqa -class dataframe_getitem_scalar(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(1000) - self.columns = tm.makeStringIndex(30) - self.df = DataFrame(np.random.rand(1000, 30), index=self.index, columns=self.columns) - self.idx = self.index[100] - self.col = self.columns[10] - - def time_dataframe_getitem_scalar(self): - self.df[self.col][self.idx] - - -class datamatrix_getitem_scalar(object): - goal_time = 0.2 - - def setup(self): - try: - self.klass = DataMatrix - except: - self.klass = DataFrame - self.index = tm.makeStringIndex(1000) - 
self.columns = tm.makeStringIndex(30) - self.df = self.klass(np.random.rand(1000, 30), index=self.index, columns=self.columns) - self.idx = self.index[100] - self.col = self.columns[10] - - def time_datamatrix_getitem_scalar(self): - self.df[self.col][self.idx] - - -class series_get_value(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(1000) - self.s = Series(np.random.rand(1000), index=self.index) - self.idx = self.index[100] - - def time_series_get_value(self): - self.s.get_value(self.idx) - - -class time_series_getitem_scalar(object): - goal_time = 0.2 - - def setup(self): - tm.N = 1000 - self.ts = tm.makeTimeSeries() - self.dt = self.ts.index[500] - - def time_time_series_getitem_scalar(self): - self.ts[self.dt] - - -class frame_iloc_big(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(dict(A=(['foo'] * 1000000))) - - def time_frame_iloc_big(self): - self.df.iloc[:100, 0] - - -class frame_iloc_dups(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame({'A': ([0.1] * 3000), 'B': ([1] * 3000), }) - self.idx = (np.array(range(30)) * 99) - self.df2 = DataFrame({'A': ([0.1] * 1000), 'B': ([1] * 1000), }) - self.df2 = concat([self.df2, (2 * self.df2), (3 * self.df2)]) - - def time_frame_iloc_dups(self): - self.df2.iloc[self.idx] +class NumericSeriesIndexing(object): -class frame_loc_dups(object): goal_time = 0.2 + params = [Int64Index, Float64Index] + param_names = ['index'] - def setup(self): - self.df = DataFrame({'A': ([0.1] * 3000), 'B': ([1] * 3000), }) - self.idx = (np.array(range(30)) * 99) - self.df2 = DataFrame({'A': ([0.1] * 1000), 'B': ([1] * 1000), }) - self.df2 = concat([self.df2, (2 * self.df2), (3 * self.df2)]) + def setup(self, index): + N = 10**6 + idx = index(range(N)) + self.data = Series(np.random.rand(N), index=idx) + self.array = np.arange(10000) + self.array_list = self.array.tolist() - def time_frame_loc_dups(self): - self.df2.loc[self.idx] + def time_getitem_scalar(self, index): + self.data[800000] + def time_getitem_slice(self, index): + self.data[:800000] -class frame_xs_mi_ix(object): - goal_time = 0.2 + def time_getitem_list_like(self, index): + self.data[[800000]] - def setup(self): - self.mi = MultiIndex.from_tuples([(x, y) for x in range(1000) for y in range(1000)]) - self.s = Series(np.random.randn(1000000), index=self.mi) - self.df = DataFrame(self.s) + def time_getitem_array(self, index): + self.data[self.array] - def time_frame_xs_mi_ix(self): - self.df.ix[999] + def time_getitem_lists(self, index): + self.data[self.array_list] + def time_iloc_array(self, index): + self.data.iloc[self.array] -class indexing_dataframe_boolean(object): - goal_time = 0.2 + def time_iloc_list_like(self, index): + self.data.iloc[[800000]] - def setup(self): - self.df = DataFrame(np.random.randn(50000, 100)) - self.df2 = DataFrame(np.random.randn(50000, 100)) + def time_iloc_scalar(self, index): + self.data.iloc[800000] - def time_indexing_dataframe_boolean(self): - (self.df > self.df2) + def time_iloc_slice(self, index): + self.data.iloc[:800000] + def time_ix_array(self, index): + self.data.ix[self.array] -class indexing_dataframe_boolean_no_ne(object): - goal_time = 0.2 + def time_ix_list_like(self, index): + self.data.ix[[800000]] - def setup(self): - if (expr is None): - raise NotImplementedError - self.df = DataFrame(np.random.randn(50000, 100)) - self.df2 = DataFrame(np.random.randn(50000, 100)) - expr.set_use_numexpr(False) + def time_ix_scalar(self, index): + self.data.ix[800000] - def 
time_indexing_dataframe_boolean_no_ne(self): - (self.df > self.df2) + def time_ix_slice(self, index): + self.data.ix[:800000] - def teardown(self): - expr.set_use_numexpr(True) + def time_loc_array(self, index): + self.data.loc[self.array] + def time_loc_list_like(self, index): + self.data.loc[[800000]] -class indexing_dataframe_boolean_rows(object): - goal_time = 0.2 + def time_loc_scalar(self, index): + self.data.loc[800000] - def setup(self): - self.df = DataFrame(np.random.randn(10000, 4), columns=['A', 'B', 'C', 'D']) - self.indexer = (self.df['B'] > 0) - self.obj_indexer = self.indexer.astype('O') + def time_loc_slice(self, index): + self.data.loc[:800000] - def time_indexing_dataframe_boolean_rows(self): - self.df[self.indexer] +class NonNumericSeriesIndexing(object): -class indexing_dataframe_boolean_rows_object(object): goal_time = 0.2 + params = ['string', 'datetime'] + param_names = ['index'] - def setup(self): - self.df = DataFrame(np.random.randn(10000, 4), columns=['A', 'B', 'C', 'D']) - self.indexer = (self.df['B'] > 0) - self.obj_indexer = self.indexer.astype('O') - - def time_indexing_dataframe_boolean_rows_object(self): - self.df[self.obj_indexer] + def setup(self, index): + N = 10**5 + indexes = {'string': tm.makeStringIndex(N), + 'datetime': date_range('1900', periods=N, freq='s')} + index = indexes[index] + self.s = Series(np.random.rand(N), index=index) + self.lbl = index[80000] + def time_getitem_label_slice(self, index): + self.s[:self.lbl] -class indexing_dataframe_boolean_st(object): - goal_time = 0.2 + def time_getitem_pos_slice(self, index): + self.s[:80000] - def setup(self): - if (expr is None): - raise NotImplementedError - self.df = DataFrame(np.random.randn(50000, 100)) - self.df2 = DataFrame(np.random.randn(50000, 100)) - expr.set_numexpr_threads(1) + def time_get_value(self, index): + with warnings.catch_warnings(record=True): + self.s.get_value(self.lbl) - def time_indexing_dataframe_boolean_st(self): - (self.df > self.df2) + def time_getitem_scalar(self, index): + self.s[self.lbl] - def teardown(self): - expr.set_numexpr_threads() +class DataFrameStringIndexing(object): -class indexing_frame_get_value(object): goal_time = 0.2 def setup(self): - self.index = tm.makeStringIndex(1000) - self.columns = tm.makeStringIndex(30) - self.df = DataFrame(np.random.randn(1000, 30), index=self.index, columns=self.columns) - self.idx = self.index[100] - self.col = self.columns[10] + index = tm.makeStringIndex(1000) + columns = tm.makeStringIndex(30) + self.df = DataFrame(np.random.randn(1000, 30), index=index, + columns=columns) + self.idx_scalar = index[100] + self.col_scalar = columns[10] + self.bool_indexer = self.df[self.col_scalar] > 0 + self.bool_obj_indexer = self.bool_indexer.astype(object) - def time_indexing_frame_get_value(self): - self.df.get_value(self.idx, self.col) + def time_get_value(self): + with warnings.catch_warnings(record=True): + self.df.get_value(self.idx_scalar, self.col_scalar) + def time_ix(self): + self.df.ix[self.idx_scalar, self.col_scalar] -class indexing_frame_get_value_ix(object): - goal_time = 0.2 + def time_loc(self): + self.df.loc[self.idx_scalar, self.col_scalar] - def setup(self): - self.index = tm.makeStringIndex(1000) - self.columns = tm.makeStringIndex(30) - self.df = DataFrame(np.random.randn(1000, 30), index=self.index, columns=self.columns) - self.idx = self.index[100] - self.col = self.columns[10] + def time_getitem_scalar(self): + self.df[self.col_scalar][self.idx_scalar] - def time_indexing_frame_get_value_ix(self): - 
self.df.ix[(self.idx, self.col)] + def time_boolean_rows(self): + self.df[self.bool_indexer] + def time_boolean_rows_object(self): + self.df[self.bool_obj_indexer] -class indexing_panel_subset(object): - goal_time = 0.2 - def setup(self): - self.p = Panel(np.random.randn(100, 100, 100)) - self.inds = range(0, 100, 10) +class DataFrameNumericIndexing(object): - def time_indexing_panel_subset(self): - self.p.ix[(self.inds, self.inds, self.inds)] - - -class multiindex_slicers(object): goal_time = 0.2 def setup(self): - np.random.seed(1234) - self.idx = pd.IndexSlice - self.n = 100000 - self.mdt = pandas.DataFrame() - self.mdt['A'] = np.random.choice(range(10000, 45000, 1000), self.n) - self.mdt['B'] = np.random.choice(range(10, 400), self.n) - self.mdt['C'] = np.random.choice(range(1, 150), self.n) - self.mdt['D'] = np.random.choice(range(10000, 45000), self.n) - self.mdt['x'] = np.random.choice(range(400), self.n) - self.mdt['y'] = np.random.choice(range(25), self.n) - self.test_A = 25000 - self.test_B = 25 - self.test_C = 40 - self.test_D = 35000 - self.eps_A = 5000 - self.eps_B = 5 - self.eps_C = 5 - self.eps_D = 5000 - self.mdt2 = self.mdt.set_index(['A', 'B', 'C', 'D']).sortlevel() - - def time_multiindex_slicers(self): - self.mdt2.loc[self.idx[(self.test_A - self.eps_A):(self.test_A + self.eps_A), (self.test_B - self.eps_B):(self.test_B + self.eps_B), (self.test_C - self.eps_C):(self.test_C + self.eps_C), (self.test_D - self.eps_D):(self.test_D + self.eps_D)], :] - - -class series_getitem_array(object): - goal_time = 0.2 + self.idx_dupe = np.array(range(30)) * 99 + self.df = DataFrame(np.random.randn(10000, 5)) + self.df_dup = concat([self.df, 2 * self.df, 3 * self.df]) + self.bool_indexer = [True] * 5000 + [False] * 5000 - def setup(self): - self.s = Series(np.random.rand(1000000)) - - def time_series_getitem_array(self): - self.s[np.arange(10000)] + def time_iloc_dups(self): + self.df_dup.iloc[self.idx_dupe] + def time_loc_dups(self): + self.df_dup.loc[self.idx_dupe] -class series_getitem_label_slice(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(1000000) - self.s = Series(np.random.rand(1000000), index=self.index) - self.lbl = self.s.index[800000] - - def time_series_getitem_label_slice(self): - self.s[:self.lbl] - + def time_iloc(self): + self.df.iloc[:100, 0] -class series_getitem_list_like(object): - goal_time = 0.2 + def time_loc(self): + self.df.loc[:100, 0] - def setup(self): - self.s = Series(np.random.rand(1000000)) + def time_bool_indexer(self): + self.df[self.bool_indexer] - def time_series_getitem_list_like(self): - self.s[[800000]] +class Take(object): -class series_getitem_pos_slice(object): goal_time = 0.2 + params = ['int', 'datetime'] + param_names = ['index'] - def setup(self): - self.index = tm.makeStringIndex(1000000) - self.s = Series(np.random.rand(1000000), index=self.index) - - def time_series_getitem_pos_slice(self): - self.s[:800000] - - -class series_getitem_scalar(object): - goal_time = 0.2 + def setup(self, index): + N = 100000 + indexes = {'int': Int64Index(np.arange(N)), + 'datetime': date_range('2011-01-01', freq='S', periods=N)} + index = indexes[index] + self.s = Series(np.random.rand(N), index=index) + self.indexer = [True, False, True, True, False] * 20000 - def setup(self): - self.s = Series(np.random.rand(1000000)) + def time_take(self, index): + self.s.take(self.indexer) - def time_series_getitem_scalar(self): - self.s[800000] +class MultiIndexing(object): -class series_getitem_slice(object): goal_time = 0.2 def 
setup(self): - self.s = Series(np.random.rand(1000000)) - - def time_series_getitem_slice(self): - self.s[:800000] + mi = MultiIndex.from_product([range(1000), range(1000)]) + self.s = Series(np.random.randn(1000000), index=mi) + self.df = DataFrame(self.s) + n = 100000 + self.mdt = DataFrame({'A': np.random.choice(range(10000, 45000, 1000), + n), + 'B': np.random.choice(range(10, 400), n), + 'C': np.random.choice(range(1, 150), n), + 'D': np.random.choice(range(10000, 45000), n), + 'x': np.random.choice(range(400), n), + 'y': np.random.choice(range(25), n)}) + self.idx = IndexSlice[20000:30000, 20:30, 35:45, 30000:40000] + self.mdt = self.mdt.set_index(['A', 'B', 'C', 'D']).sort_index() + + def time_series_ix(self): + self.s.ix[999] -class series_iloc_array(object): - goal_time = 0.2 + def time_frame_ix(self): + self.df.ix[999] - def setup(self): - self.s = Series(np.random.rand(1000000)) + def time_index_slice(self): + self.mdt.loc[self.idx, :] - def time_series_iloc_array(self): - self.s.iloc[np.arange(10000)] +class IntervalIndexing(object): -class series_iloc_list_like(object): goal_time = 0.2 - def setup(self): - self.s = Series(np.random.rand(1000000)) + def setup_cache(self): + idx = IntervalIndex.from_breaks(np.arange(1000001)) + monotonic = Series(np.arange(1000000), index=idx) + return monotonic - def time_series_iloc_list_like(self): - self.s.iloc[[800000]] + def time_getitem_scalar(self, monotonic): + monotonic[80000] + def time_loc_scalar(self, monotonic): + monotonic.loc[80000] -class series_iloc_scalar(object): - goal_time = 0.2 + def time_getitem_list(self, monotonic): + monotonic[80000:] - def setup(self): - self.s = Series(np.random.rand(1000000)) + def time_loc_list(self, monotonic): + monotonic.loc[80000:] - def time_series_iloc_scalar(self): - self.s.iloc[800000] +class CategoricalIndexIndexing(object): -class series_iloc_slice(object): goal_time = 0.2 + params = ['monotonic_incr', 'monotonic_decr', 'non_monotonic'] + param_names = ['index'] - def setup(self): - self.s = Series(np.random.rand(1000000)) + def setup(self, index): + N = 10**5 + values = list('a' * N + 'b' * N + 'c' * N) + indices = { + 'monotonic_incr': CategoricalIndex(values), + 'monotonic_decr': CategoricalIndex(reversed(values)), + 'non_monotonic': CategoricalIndex(list('abc' * N))} + self.data = indices[index] - def time_series_iloc_slice(self): - self.s.iloc[:800000] + self.int_scalar = 10000 + self.int_list = list(range(10000)) + self.cat_scalar = 'b' + self.cat_list = ['a', 'c'] -class series_ix_array(object): - goal_time = 0.2 + def time_getitem_scalar(self, index): + self.data[self.int_scalar] - def setup(self): - self.s = Series(np.random.rand(1000000)) + def time_getitem_slice(self, index): + self.data[:self.int_scalar] - def time_series_ix_array(self): - self.s.ix[np.arange(10000)] + def time_getitem_list_like(self, index): + self.data[[self.int_scalar]] + def time_getitem_list(self, index): + self.data[self.int_list] -class series_ix_list_like(object): - goal_time = 0.2 + def time_getitem_bool_array(self, index): + self.data[self.data == self.cat_scalar] - def setup(self): - self.s = Series(np.random.rand(1000000)) + def time_get_loc_scalar(self, index): + self.data.get_loc(self.cat_scalar) - def time_series_ix_list_like(self): - self.s.ix[[800000]] + def time_get_indexer_list(self, index): + self.data.get_indexer(self.cat_list) -class series_ix_scalar(object): - goal_time = 0.2 +class PanelIndexing(object): - def setup(self): - self.s = Series(np.random.rand(1000000)) - - def 
time_series_ix_scalar(self): - self.s.ix[800000] - - -class series_ix_slice(object): goal_time = 0.2 def setup(self): - self.s = Series(np.random.rand(1000000)) - - def time_series_ix_slice(self): - self.s.ix[:800000] + with warnings.catch_warnings(record=True): + self.p = Panel(np.random.randn(100, 100, 100)) + self.inds = range(0, 100, 10) + def time_subset(self): + with warnings.catch_warnings(record=True): + self.p.ix[(self.inds, self.inds, self.inds)] -class series_loc_array(object): - goal_time = 0.2 - - def setup(self): - self.s = Series(np.random.rand(1000000)) - - def time_series_loc_array(self): - self.s.loc[np.arange(10000)] +class MethodLookup(object): -class series_loc_list_like(object): goal_time = 0.2 - def setup(self): - self.s = Series(np.random.rand(1000000)) - - def time_series_loc_list_like(self): - self.s.loc[[800000]] + def setup_cache(self): + s = Series() + return s + def time_lookup_iloc(self, s): + s.iloc -class series_loc_scalar(object): - goal_time = 0.2 + def time_lookup_ix(self, s): + s.ix - def setup(self): - self.s = Series(np.random.rand(1000000)) + def time_lookup_loc(self, s): + s.loc - def time_series_loc_scalar(self): - self.s.loc[800000] +class GetItemSingleColumn(object): -class series_loc_slice(object): goal_time = 0.2 def setup(self): - self.s = Series(np.random.rand(1000000)) + self.df_string_col = DataFrame(np.random.randn(3000, 1), columns=['A']) + self.df_int_col = DataFrame(np.random.randn(3000, 1)) - def time_series_loc_slice(self): - self.s.loc[:800000] - - -class series_take_dtindex(object): - goal_time = 0.2 + def time_frame_getitem_single_column_label(self): + self.df_string_col['A'] - def setup(self): - self.s = Series(np.random.rand(100000)) - self.ts = Series(np.random.rand(100000), index=date_range('2011-01-01', freq='S', periods=100000)) - self.indexer = ([True, False, True, True, False] * 20000) + def time_frame_getitem_single_column_int(self): + self.df_int_col[0] - def time_series_take_dtindex(self): - self.ts.take(self.indexer) +class AssignTimeseriesIndex(object): -class series_take_intindex(object): goal_time = 0.2 def setup(self): - self.s = Series(np.random.rand(100000)) - self.ts = Series(np.random.rand(100000), index=date_range('2011-01-01', freq='S', periods=100000)) - self.indexer = ([True, False, True, True, False] * 20000) - - def time_series_take_intindex(self): - self.s.take(self.indexer) - + N = 100000 + idx = date_range('1/1/2000', periods=N, freq='H') + self.df = DataFrame(np.random.randn(N, 1), columns=['A'], index=idx) -class series_xs_mi_ix(object): - goal_time = 0.2 - - def setup(self): - self.mi = MultiIndex.from_tuples([(x, y) for x in range(1000) for y in range(1000)]) - self.s = Series(np.random.randn(1000000), index=self.mi) + def time_frame_assign_timeseries_index(self): + self.df['date'] = self.df.index - def time_series_xs_mi_ix(self): - self.s.ix[999] +class InsertColumns(object): -class sort_level_one(object): goal_time = 0.2 def setup(self): - self.a = np.repeat(np.arange(100), 1000) - self.b = np.tile(np.arange(1000), 100) - self.midx = MultiIndex.from_arrays([self.a, self.b]) - self.midx = self.midx.take(np.random.permutation(np.arange(100000))) + self.N = 10**3 + self.df = DataFrame(index=range(self.N)) - def time_sort_level_one(self): - self.midx.sortlevel(1) - - -class sort_level_zero(object): - goal_time = 0.2 - - def setup(self): - self.a = np.repeat(np.arange(100), 1000) - self.b = np.tile(np.arange(1000), 100) - self.midx = MultiIndex.from_arrays([self.a, self.b]) - self.midx = 
self.midx.take(np.random.permutation(np.arange(100000))) + def time_insert(self): + np.random.seed(1234) + for i in range(100): + self.df.insert(0, i, np.random.randn(self.N), + allow_duplicates=True) - def time_sort_level_zero(self): - self.midx.sortlevel(0) \ No newline at end of file + def time_assign_with_setitem(self): + np.random.seed(1234) + for i in range(100): + self.df[i] = np.random.randn(self.N) diff --git a/asv_bench/benchmarks/inference.py b/asv_bench/benchmarks/inference.py index 3fceed087facb..16d9e7cd73cbb 100644 --- a/asv_bench/benchmarks/inference.py +++ b/asv_bench/benchmarks/inference.py @@ -1,138 +1,113 @@ -from .pandas_vb_common import * -import pandas as pd +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, Series, to_numeric +from .pandas_vb_common import numeric_dtypes, lib, setup # noqa -class dtype_infer_datetime64(object): + +class NumericInferOps(object): + # from GH 7332 goal_time = 0.2 + params = numeric_dtypes + param_names = ['dtype'] - def setup(self): - self.N = 500000 - self.df_int64 = DataFrame(dict(A=np.arange(self.N, dtype='int64'), B=np.arange(self.N, dtype='int64'))) - self.df_int32 = DataFrame(dict(A=np.arange(self.N, dtype='int32'), B=np.arange(self.N, dtype='int32'))) - self.df_uint32 = DataFrame(dict(A=np.arange(self.N, dtype='uint32'), B=np.arange(self.N, dtype='uint32'))) - self.df_float64 = DataFrame(dict(A=np.arange(self.N, dtype='float64'), B=np.arange(self.N, dtype='float64'))) - self.df_float32 = DataFrame(dict(A=np.arange(self.N, dtype='float32'), B=np.arange(self.N, dtype='float32'))) - self.df_datetime64 = DataFrame(dict(A=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'), B=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'))) - self.df_timedelta64 = DataFrame(dict(A=(self.df_datetime64['A'] - self.df_datetime64['B']), B=self.df_datetime64['B'])) + def setup(self, dtype): + N = 5 * 10**5 + self.df = DataFrame({'A': np.arange(N).astype(dtype), + 'B': np.arange(N).astype(dtype)}) - def time_dtype_infer_datetime64(self): - (self.df_datetime64['A'] - self.df_datetime64['B']) + def time_add(self, dtype): + self.df['A'] + self.df['B'] + def time_subtract(self, dtype): + self.df['A'] - self.df['B'] -class dtype_infer_float32(object): - goal_time = 0.2 + def time_multiply(self, dtype): + self.df['A'] * self.df['B'] - def setup(self): - self.N = 500000 - self.df_int64 = DataFrame(dict(A=np.arange(self.N, dtype='int64'), B=np.arange(self.N, dtype='int64'))) - self.df_int32 = DataFrame(dict(A=np.arange(self.N, dtype='int32'), B=np.arange(self.N, dtype='int32'))) - self.df_uint32 = DataFrame(dict(A=np.arange(self.N, dtype='uint32'), B=np.arange(self.N, dtype='uint32'))) - self.df_float64 = DataFrame(dict(A=np.arange(self.N, dtype='float64'), B=np.arange(self.N, dtype='float64'))) - self.df_float32 = DataFrame(dict(A=np.arange(self.N, dtype='float32'), B=np.arange(self.N, dtype='float32'))) - self.df_datetime64 = DataFrame(dict(A=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'), B=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'))) - self.df_timedelta64 = DataFrame(dict(A=(self.df_datetime64['A'] - self.df_datetime64['B']), B=self.df_datetime64['B'])) + def time_divide(self, dtype): + self.df['A'] / self.df['B'] - def time_dtype_infer_float32(self): - (self.df_float32['A'] + self.df_float32['B']) + def time_modulo(self, dtype): + self.df['A'] % self.df['B'] -class dtype_infer_float64(object): +class DateInferOps(object): + # from GH 7332 goal_time = 0.2 - def setup(self): - 
self.N = 500000 - self.df_int64 = DataFrame(dict(A=np.arange(self.N, dtype='int64'), B=np.arange(self.N, dtype='int64'))) - self.df_int32 = DataFrame(dict(A=np.arange(self.N, dtype='int32'), B=np.arange(self.N, dtype='int32'))) - self.df_uint32 = DataFrame(dict(A=np.arange(self.N, dtype='uint32'), B=np.arange(self.N, dtype='uint32'))) - self.df_float64 = DataFrame(dict(A=np.arange(self.N, dtype='float64'), B=np.arange(self.N, dtype='float64'))) - self.df_float32 = DataFrame(dict(A=np.arange(self.N, dtype='float32'), B=np.arange(self.N, dtype='float32'))) - self.df_datetime64 = DataFrame(dict(A=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'), B=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'))) - self.df_timedelta64 = DataFrame(dict(A=(self.df_datetime64['A'] - self.df_datetime64['B']), B=self.df_datetime64['B'])) + def setup_cache(self): + N = 5 * 10**5 + df = DataFrame({'datetime64': np.arange(N).astype('datetime64[ms]')}) + df['timedelta'] = df['datetime64'] - df['datetime64'] + return df - def time_dtype_infer_float64(self): - (self.df_float64['A'] + self.df_float64['B']) + def time_subtract_datetimes(self, df): + df['datetime64'] - df['datetime64'] + def time_timedelta_plus_datetime(self, df): + df['timedelta'] + df['datetime64'] -class dtype_infer_int32(object): - goal_time = 0.2 + def time_add_timedeltas(self, df): + df['timedelta'] + df['timedelta'] - def setup(self): - self.N = 500000 - self.df_int64 = DataFrame(dict(A=np.arange(self.N, dtype='int64'), B=np.arange(self.N, dtype='int64'))) - self.df_int32 = DataFrame(dict(A=np.arange(self.N, dtype='int32'), B=np.arange(self.N, dtype='int32'))) - self.df_uint32 = DataFrame(dict(A=np.arange(self.N, dtype='uint32'), B=np.arange(self.N, dtype='uint32'))) - self.df_float64 = DataFrame(dict(A=np.arange(self.N, dtype='float64'), B=np.arange(self.N, dtype='float64'))) - self.df_float32 = DataFrame(dict(A=np.arange(self.N, dtype='float32'), B=np.arange(self.N, dtype='float32'))) - self.df_datetime64 = DataFrame(dict(A=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'), B=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'))) - self.df_timedelta64 = DataFrame(dict(A=(self.df_datetime64['A'] - self.df_datetime64['B']), B=self.df_datetime64['B'])) - def time_dtype_infer_int32(self): - (self.df_int32['A'] + self.df_int32['B']) +class ToNumeric(object): - -class dtype_infer_int64(object): goal_time = 0.2 + params = ['ignore', 'coerce'] + param_names = ['errors'] - def setup(self): - self.N = 500000 - self.df_int64 = DataFrame(dict(A=np.arange(self.N, dtype='int64'), B=np.arange(self.N, dtype='int64'))) - self.df_int32 = DataFrame(dict(A=np.arange(self.N, dtype='int32'), B=np.arange(self.N, dtype='int32'))) - self.df_uint32 = DataFrame(dict(A=np.arange(self.N, dtype='uint32'), B=np.arange(self.N, dtype='uint32'))) - self.df_float64 = DataFrame(dict(A=np.arange(self.N, dtype='float64'), B=np.arange(self.N, dtype='float64'))) - self.df_float32 = DataFrame(dict(A=np.arange(self.N, dtype='float32'), B=np.arange(self.N, dtype='float32'))) - self.df_datetime64 = DataFrame(dict(A=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'), B=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'))) - self.df_timedelta64 = DataFrame(dict(A=(self.df_datetime64['A'] - self.df_datetime64['B']), B=self.df_datetime64['B'])) + def setup(self, errors): + N = 10000 + self.float = Series(np.random.randn(N)) + self.numstr = self.float.astype('str') + self.str = Series(tm.makeStringIndex(N)) - def 
time_dtype_infer_int64(self): - (self.df_int64['A'] + self.df_int64['B']) + def time_from_float(self, errors): + to_numeric(self.float, errors=errors) + def time_from_numeric_str(self, errors): + to_numeric(self.numstr, errors=errors) -class dtype_infer_timedelta64_1(object): - goal_time = 0.2 + def time_from_str(self, errors): + to_numeric(self.str, errors=errors) - def setup(self): - self.N = 500000 - self.df_int64 = DataFrame(dict(A=np.arange(self.N, dtype='int64'), B=np.arange(self.N, dtype='int64'))) - self.df_int32 = DataFrame(dict(A=np.arange(self.N, dtype='int32'), B=np.arange(self.N, dtype='int32'))) - self.df_uint32 = DataFrame(dict(A=np.arange(self.N, dtype='uint32'), B=np.arange(self.N, dtype='uint32'))) - self.df_float64 = DataFrame(dict(A=np.arange(self.N, dtype='float64'), B=np.arange(self.N, dtype='float64'))) - self.df_float32 = DataFrame(dict(A=np.arange(self.N, dtype='float32'), B=np.arange(self.N, dtype='float32'))) - self.df_datetime64 = DataFrame(dict(A=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'), B=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'))) - self.df_timedelta64 = DataFrame(dict(A=(self.df_datetime64['A'] - self.df_datetime64['B']), B=self.df_datetime64['B'])) - def time_dtype_infer_timedelta64_1(self): - (self.df_timedelta64['A'] + self.df_timedelta64['B']) +class ToNumericDowncast(object): + param_names = ['dtype', 'downcast'] + params = [['string-float', 'string-int', 'string-nint', 'datetime64', + 'int-list', 'int32'], + [None, 'integer', 'signed', 'unsigned', 'float']] -class dtype_infer_timedelta64_2(object): - goal_time = 0.2 + N = 500000 + N2 = int(N / 2) - def setup(self): - self.N = 500000 - self.df_int64 = DataFrame(dict(A=np.arange(self.N, dtype='int64'), B=np.arange(self.N, dtype='int64'))) - self.df_int32 = DataFrame(dict(A=np.arange(self.N, dtype='int32'), B=np.arange(self.N, dtype='int32'))) - self.df_uint32 = DataFrame(dict(A=np.arange(self.N, dtype='uint32'), B=np.arange(self.N, dtype='uint32'))) - self.df_float64 = DataFrame(dict(A=np.arange(self.N, dtype='float64'), B=np.arange(self.N, dtype='float64'))) - self.df_float32 = DataFrame(dict(A=np.arange(self.N, dtype='float32'), B=np.arange(self.N, dtype='float32'))) - self.df_datetime64 = DataFrame(dict(A=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'), B=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'))) - self.df_timedelta64 = DataFrame(dict(A=(self.df_datetime64['A'] - self.df_datetime64['B']), B=self.df_datetime64['B'])) + data_dict = {'string-int': ['1'] * N2 + [2] * N2, + 'string-nint': ['-1'] * N2 + [2] * N2, + 'datetime64': np.repeat(np.array(['1970-01-01', '1970-01-02'], + dtype='datetime64[D]'), N), + 'string-float': ['1.1'] * N2 + [2] * N2, + 'int-list': [1] * N2 + [2] * N2, + 'int32': np.repeat(np.int32(1), N)} - def time_dtype_infer_timedelta64_2(self): - (self.df_timedelta64['A'] + self.df_timedelta64['A']) + def setup(self, dtype, downcast): + self.data = self.data_dict[dtype] + def time_downcast(self, dtype, downcast): + to_numeric(self.data, downcast=downcast) -class dtype_infer_uint32(object): - goal_time = 0.2 - def setup(self): - self.N = 500000 - self.df_int64 = DataFrame(dict(A=np.arange(self.N, dtype='int64'), B=np.arange(self.N, dtype='int64'))) - self.df_int32 = DataFrame(dict(A=np.arange(self.N, dtype='int32'), B=np.arange(self.N, dtype='int32'))) - self.df_uint32 = DataFrame(dict(A=np.arange(self.N, dtype='uint32'), B=np.arange(self.N, dtype='uint32'))) - self.df_float64 = DataFrame(dict(A=np.arange(self.N, 
dtype='float64'), B=np.arange(self.N, dtype='float64'))) - self.df_float32 = DataFrame(dict(A=np.arange(self.N, dtype='float32'), B=np.arange(self.N, dtype='float32'))) - self.df_datetime64 = DataFrame(dict(A=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'), B=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'))) - self.df_timedelta64 = DataFrame(dict(A=(self.df_datetime64['A'] - self.df_datetime64['B']), B=self.df_datetime64['B'])) - - def time_dtype_infer_uint32(self): - (self.df_uint32['A'] + self.df_uint32['B']) \ No newline at end of file +class MaybeConvertNumeric(object): + + def setup_cache(self): + N = 10**6 + arr = np.repeat([2**63], N) + np.arange(N).astype('uint64') + data = arr.astype(object) + data[1::2] = arr[1::2].astype(str) + data[-1] = -1 + return data + + def time_convert(self, data): + lib.maybe_convert_numeric(data, set(), coerce_numeric=False) diff --git a/doc/sphinxext/ipython_sphinxext/__init__.py b/asv_bench/benchmarks/io/__init__.py similarity index 100% rename from doc/sphinxext/ipython_sphinxext/__init__.py rename to asv_bench/benchmarks/io/__init__.py diff --git a/asv_bench/benchmarks/io/csv.py b/asv_bench/benchmarks/io/csv.py new file mode 100644 index 0000000000000..0f5d07f9fac55 --- /dev/null +++ b/asv_bench/benchmarks/io/csv.py @@ -0,0 +1,217 @@ +import random +import timeit +import string + +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, Categorical, date_range, read_csv +from pandas.compat import PY2 +from pandas.compat import cStringIO as StringIO + +from ..pandas_vb_common import setup, BaseIO # noqa + + +class ToCSV(BaseIO): + + goal_time = 0.2 + fname = '__test__.csv' + params = ['wide', 'long', 'mixed'] + param_names = ['kind'] + + def setup(self, kind): + wide_frame = DataFrame(np.random.randn(3000, 30)) + long_frame = DataFrame({'A': np.arange(50000), + 'B': np.arange(50000) + 1., + 'C': np.arange(50000) + 2., + 'D': np.arange(50000) + 3.}) + mixed_frame = DataFrame({'float': np.random.randn(5000), + 'int': np.random.randn(5000).astype(int), + 'bool': (np.arange(5000) % 2) == 0, + 'datetime': date_range('2001', + freq='s', + periods=5000), + 'object': ['foo'] * 5000}) + mixed_frame.loc[30:500, 'float'] = np.nan + data = {'wide': wide_frame, + 'long': long_frame, + 'mixed': mixed_frame} + self.df = data[kind] + + def time_frame(self, kind): + self.df.to_csv(self.fname) + + +class ToCSVDatetime(BaseIO): + + goal_time = 0.2 + fname = '__test__.csv' + + def setup(self): + rng = date_range('1/1/2000', periods=1000) + self.data = DataFrame(rng, index=rng) + + def time_frame_date_formatting(self): + self.data.to_csv(self.fname, date_format='%Y%m%d') + + +class ReadCSVDInferDatetimeFormat(object): + + goal_time = 0.2 + params = ([True, False], ['custom', 'iso8601', 'ymd']) + param_names = ['infer_datetime_format', 'format'] + + def setup(self, infer_datetime_format, format): + rng = date_range('1/1/2000', periods=1000) + formats = {'custom': '%m/%d/%Y %H:%M:%S.%f', + 'iso8601': '%Y-%m-%d %H:%M:%S', + 'ymd': '%Y%m%d'} + dt_format = formats[format] + self.data = StringIO('\n'.join(rng.strftime(dt_format).tolist())) + + def time_read_csv(self, infer_datetime_format, format): + read_csv(self.data, header=None, names=['foo'], parse_dates=['foo'], + infer_datetime_format=infer_datetime_format) + + +class ReadCSVSkipRows(BaseIO): + + goal_time = 0.2 + fname = '__test__.csv' + params = [None, 10000] + param_names = ['skiprows'] + + def setup(self, skiprows): + N = 20000 + index = tm.makeStringIndex(N) + df = 
DataFrame({'float1': np.random.randn(N), + 'float2': np.random.randn(N), + 'string1': ['foo'] * N, + 'bool1': [True] * N, + 'int1': np.random.randint(0, N, size=N)}, + index=index) + df.to_csv(self.fname) + + def time_skiprows(self, skiprows): + read_csv(self.fname, skiprows=skiprows) + + +class ReadUint64Integers(object): + + goal_time = 0.2 + + def setup(self): + self.na_values = [2**63 + 500] + arr = np.arange(10000).astype('uint64') + 2**63 + self.data1 = StringIO('\n'.join(arr.astype(str).tolist())) + arr = arr.astype(object) + arr[500] = -1 + self.data2 = StringIO('\n'.join(arr.astype(str).tolist())) + + def time_read_uint64(self): + read_csv(self.data1, header=None, names=['foo']) + + def time_read_uint64_neg_values(self): + read_csv(self.data2, header=None, names=['foo']) + + def time_read_uint64_na_values(self): + read_csv(self.data1, header=None, names=['foo'], + na_values=self.na_values) + + +class ReadCSVThousands(BaseIO): + + goal_time = 0.2 + fname = '__test__.csv' + params = ([',', '|'], [None, ',']) + param_names = ['sep', 'thousands'] + + def setup(self, sep, thousands): + N = 10000 + K = 8 + data = np.random.randn(N, K) * np.random.randint(100, 10000, (N, K)) + df = DataFrame(data) + if thousands is not None: + fmt = ':{}'.format(thousands) + fmt = '{' + fmt + '}' + df = df.applymap(lambda x: fmt.format(x)) + df.to_csv(self.fname, sep=sep) + + def time_thousands(self, sep, thousands): + read_csv(self.fname, sep=sep, thousands=thousands) + + +class ReadCSVComment(object): + + goal_time = 0.2 + + def setup(self): + data = ['A,B,C'] + (['1,2,3 # comment'] * 100000) + self.s_data = StringIO('\n'.join(data)) + + def time_comment(self): + read_csv(self.s_data, comment='#', header=None, names=list('abc')) + + +class ReadCSVFloatPrecision(object): + + goal_time = 0.2 + params = ([',', ';'], ['.', '_'], [None, 'high', 'round_trip']) + param_names = ['sep', 'decimal', 'float_precision'] + + def setup(self, sep, decimal, float_precision): + floats = [''.join(random.choice(string.digits) for _ in range(28)) + for _ in range(15)] + rows = sep.join(['0{}'.format(decimal) + '{}'] * 3) + '\n' + data = rows * 5 + data = data.format(*floats) * 200 # 1000 x 3 strings csv + self.s_data = StringIO(data) + + def time_read_csv(self, sep, decimal, float_precision): + read_csv(self.s_data, sep=sep, header=None, names=list('abc'), + float_precision=float_precision) + + def time_read_csv_python_engine(self, sep, decimal, float_precision): + read_csv(self.s_data, sep=sep, header=None, engine='python', + float_precision=None, names=list('abc')) + + +class ReadCSVCategorical(BaseIO): + + goal_time = 0.2 + fname = '__test__.csv' + + def setup(self): + N = 100000 + group1 = ['aaaaaaaa', 'bbbbbbb', 'cccccccc', 'dddddddd', 'eeeeeeee'] + df = DataFrame(np.random.choice(group1, (N, 3)), columns=list('abc')) + df.to_csv(self.fname, index=False) + + def time_convert_post(self): + read_csv(self.fname).apply(Categorical) + + def time_convert_direct(self): + read_csv(self.fname, dtype='category')
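
When several physical columns jointly encode one timestamp, `read_csv` in this era of pandas accepts a list of column lists for `parse_dates` and concatenates each group into a single column before parsing, which is what the `ReadCSVParseDates` benchmark below exercises. A small sketch of the behavior (illustrative only, not part of this patch):

    from pandas import read_csv
    from pandas.compat import cStringIO as StringIO

    # columns 0 and 1 hold the date and the time separately;
    # parse_dates=[[0, 1]] joins them into one parsed datetime column
    csv = StringIO('19990127,19:00:00,0.81\n19990127,20:00:00,0.01\n')
    df = read_csv(csv, header=None, parse_dates=[[0, 1]])

+ + +class ReadCSVParseDates(object): + + goal_time = 0.2 + + def setup(self): + data = """{},19:00:00,18:56:00,0.8100,2.8100,7.2000,0.0000,280.0000\n + {},20:00:00,19:56:00,0.0100,2.2100,7.2000,0.0000,260.0000\n + {},21:00:00,20:56:00,-0.5900,2.2100,5.7000,0.0000,280.0000\n + {},21:00:00,21:18:00,-0.9900,2.0100,3.6000,0.0000,270.0000\n + {},22:00:00,21:56:00,-0.5900,1.7100,5.1000,0.0000,290.0000\n + """ + two_cols = ['KORD,19990127'] * 5 + data = data.format(*two_cols) + self.s_data = StringIO(data) + + def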
time_multiple_date(self): + read_csv(self.s_data, sep=',', header=None, + names=list(string.digits[:9]), parse_dates=[[1, 2], [1, 3]]) + + def time_baseline(self): + read_csv(self.s_data, sep=',', header=None, parse_dates=[1], + names=list(string.digits[:9])) diff --git a/asv_bench/benchmarks/io/excel.py b/asv_bench/benchmarks/io/excel.py new file mode 100644 index 0000000000000..58ab6bb8046c5 --- /dev/null +++ b/asv_bench/benchmarks/io/excel.py @@ -0,0 +1,36 @@ +import numpy as np +from pandas import DataFrame, date_range, ExcelWriter, read_excel +from pandas.compat import BytesIO +import pandas.util.testing as tm + +from ..pandas_vb_common import BaseIO, setup # noqa + + +class Excel(object): + + goal_time = 0.2 + params = ['openpyxl', 'xlsxwriter', 'xlwt'] + param_names = ['engine'] + + def setup(self, engine): + N = 2000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] = tm.makeStringIndex(N) + self.bio_read = BytesIO() + self.writer_read = ExcelWriter(self.bio_read, engine=engine) + self.df.to_excel(self.writer_read, sheet_name='Sheet1') + self.writer_read.save() + self.bio_read.seek(0) + + def time_read_excel(self, engine): + read_excel(self.bio_read) + + def time_write_excel(self, engine): + bio_write = BytesIO() + bio_write.seek(0) + writer_write = ExcelWriter(bio_write, engine=engine) + self.df.to_excel(writer_write, sheet_name='Sheet1') + writer_write.save() diff --git a/asv_bench/benchmarks/io/hdf.py b/asv_bench/benchmarks/io/hdf.py new file mode 100644 index 0000000000000..4b6e1d69af92d --- /dev/null +++ b/asv_bench/benchmarks/io/hdf.py @@ -0,0 +1,151 @@ +import warnings + +import numpy as np +from pandas import DataFrame, Panel, date_range, HDFStore, read_hdf +import pandas.util.testing as tm + +from ..pandas_vb_common import BaseIO, setup # noqa + + +class HDFStoreDataFrame(BaseIO): + + goal_time = 0.2 + + def setup(self): + N = 25000 + index = tm.makeStringIndex(N) + self.df = DataFrame({'float1': np.random.randn(N), + 'float2': np.random.randn(N)}, + index=index) + self.df_mixed = DataFrame({'float1': np.random.randn(N), + 'float2': np.random.randn(N), + 'string1': ['foo'] * N, + 'bool1': [True] * N, + 'int1': np.random.randint(0, N, size=N)}, + index=index) + self.df_wide = DataFrame(np.random.randn(N, 100)) + self.start_wide = self.df_wide.index[10000] + self.stop_wide = self.df_wide.index[15000] + self.df2 = DataFrame({'float1': np.random.randn(N), + 'float2': np.random.randn(N)}, + index=date_range('1/1/2000', periods=N)) + self.start = self.df2.index[10000] + self.stop = self.df2.index[15000] + self.df_wide2 = DataFrame(np.random.randn(N, 100), + index=date_range('1/1/2000', periods=N)) + self.df_dc = DataFrame(np.random.randn(N, 10), + columns=['C%03d' % i for i in range(10)]) + + self.fname = '__test__.h5' + + self.store = HDFStore(self.fname) + self.store.put('fixed', self.df) + self.store.put('fixed_mixed', self.df_mixed) + self.store.append('table', self.df2) + self.store.append('table_mixed', self.df_mixed) + self.store.append('table_wide', self.df_wide) + self.store.append('table_wide2', self.df_wide2) + + def teardown(self): + self.store.close() + self.remove(self.fname) + + def time_read_store(self): + self.store.get('fixed') + + def time_read_store_mixed(self): + self.store.get('fixed_mixed') + + def time_write_store(self): + self.store.put('fixed_write', self.df) + + def time_write_store_mixed(self): + 
self.store.put('fixed_mixed_write', self.df_mixed) + + def time_read_store_table_mixed(self): + self.store.select('table_mixed') + + def time_write_store_table_mixed(self): + self.store.append('table_mixed_write', self.df_mixed) + + def time_read_store_table(self): + self.store.select('table') + + def time_write_store_table(self): + self.store.append('table_write', self.df) + + def time_read_store_table_wide(self): + self.store.select('table_wide') + + def time_write_store_table_wide(self): + self.store.append('table_wide_write', self.df_wide) + + def time_write_store_table_dc(self): + self.store.append('table_dc_write', self.df_dc, data_columns=True) + + def time_query_store_table_wide(self): + self.store.select('table_wide', where="index > self.start_wide and " + "index < self.stop_wide") + + def time_query_store_table(self): + self.store.select('table', where="index > self.start and " + "index < self.stop") + + def time_store_repr(self): + repr(self.store) + + def time_store_str(self): + str(self.store) + + def time_store_info(self): + self.store.info() + + +class HDFStorePanel(BaseIO): + + goal_time = 0.2 + + def setup(self): + self.fname = '__test__.h5' + with warnings.catch_warnings(record=True): + self.p = Panel(np.random.randn(20, 1000, 25), + items=['Item%03d' % i for i in range(20)], + major_axis=date_range('1/1/2000', periods=1000), + minor_axis=['E%03d' % i for i in range(25)]) + self.store = HDFStore(self.fname) + self.store.append('p1', self.p) + + def teardown(self): + self.store.close() + self.remove(self.fname) + + def time_read_store_table_panel(self): + with warnings.catch_warnings(record=True): + self.store.select('p1') + + def time_write_store_table_panel(self): + with warnings.catch_warnings(record=True): + self.store.append('p2', self.p) + + +class HDF(BaseIO): + + goal_time = 0.2 + params = ['table', 'fixed'] + param_names = ['format'] + + def setup(self, format): + self.fname = '__test__.h5' + N = 100000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] = tm.makeStringIndex(N) + self.df.to_hdf(self.fname, 'df', format=format) + + def time_read_hdf(self, format): + read_hdf(self.fname, 'df') + + def time_write_hdf(self, format): + self.df.to_hdf(self.fname, 'df', format=format) diff --git a/asv_bench/benchmarks/io/json.py b/asv_bench/benchmarks/io/json.py new file mode 100644 index 0000000000000..acfdd327c3b51 --- /dev/null +++ b/asv_bench/benchmarks/io/json.py @@ -0,0 +1,127 @@ +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, date_range, timedelta_range, concat, read_json + +from ..pandas_vb_common import setup, BaseIO # noqa + + +class ReadJSON(BaseIO): + + goal_time = 0.2 + fname = "__test__.json" + params = (['split', 'index', 'records'], ['int', 'datetime']) + param_names = ['orient', 'index'] + + def setup(self, orient, index): + N = 100000 + indexes = {'int': np.arange(N), + 'datetime': date_range('20000101', periods=N, freq='H')} + df = DataFrame(np.random.randn(N, 5), + columns=['float_{}'.format(i) for i in range(5)], + index=indexes[index]) + df.to_json(self.fname, orient=orient) + + def time_read_json(self, orient, index): + read_json(self.fname, orient=orient) + + +class ReadJSONLines(BaseIO): + + goal_time = 0.2 + fname = "__test_lines__.json" + params = ['int', 'datetime'] + param_names = ['index'] + + def setup(self, index): + N = 100000 + indexes = {'int': np.arange(N), + 'datetime': 
date_range('20000101', periods=N, freq='H')} + df = DataFrame(np.random.randn(N, 5), + columns=['float_{}'.format(i) for i in range(5)], + index=indexes[index]) + df.to_json(self.fname, orient='records', lines=True) + + def time_read_json_lines(self, index): + read_json(self.fname, orient='records', lines=True) + + def time_read_json_lines_concat(self, index): + concat(read_json(self.fname, orient='records', lines=True, + chunksize=25000)) + + def peakmem_read_json_lines(self, index): + read_json(self.fname, orient='records', lines=True) + + def peakmem_read_json_lines_concat(self, index): + concat(read_json(self.fname, orient='records', lines=True, + chunksize=25000)) + + +class ToJSON(BaseIO): + + goal_time = 0.2 + fname = "__test__.json" + params = ['split', 'columns', 'index'] + param_names = ['orient'] + + def setup(self, orient): + N = 10**5 + ncols = 5 + index = date_range('20000101', periods=N, freq='H') + timedeltas = timedelta_range(start=1, periods=N, freq='s') + datetimes = date_range(start=1, periods=N, freq='s') + ints = np.random.randint(100000000, size=N) + floats = np.random.randn(N) + strings = tm.makeStringIndex(N) + self.df = DataFrame(np.random.randn(N, ncols), index=np.arange(N)) + self.df_date_idx = DataFrame(np.random.randn(N, ncols), index=index) + self.df_td_int_ts = DataFrame({'td_1': timedeltas, + 'td_2': timedeltas, + 'int_1': ints, + 'int_2': ints, + 'ts_1': datetimes, + 'ts_2': datetimes}, + index=index) + self.df_int_floats = DataFrame({'int_1': ints, + 'int_2': ints, + 'int_3': ints, + 'float_1': floats, + 'float_2': floats, + 'float_3': floats}, + index=index) + self.df_int_float_str = DataFrame({'int_1': ints, + 'int_2': ints, + 'float_1': floats, + 'float_2': floats, + 'str_1': strings, + 'str_2': strings}, + index=index) + + def time_floats_with_int_index(self, orient): + self.df.to_json(self.fname, orient=orient) + + def time_floats_with_dt_index(self, orient): + self.df_date_idx.to_json(self.fname, orient=orient) + + def time_delta_int_tstamp(self, orient): + self.df_td_int_ts.to_json(self.fname, orient=orient) + + def time_float_int(self, orient): + self.df_int_floats.to_json(self.fname, orient=orient) + + def time_float_int_str(self, orient): + self.df_int_float_str.to_json(self.fname, orient=orient) + + def time_floats_with_int_index_lines(self, orient): + self.df.to_json(self.fname, orient='records', lines=True) + + def time_floats_with_dt_index_lines(self, orient): + self.df_date_idx.to_json(self.fname, orient='records', lines=True) + + def time_delta_int_tstamp_lines(self, orient): + self.df_td_int_ts.to_json(self.fname, orient='records', lines=True) + + def time_float_int_lines(self, orient): + self.df_int_floats.to_json(self.fname, orient='records', lines=True) + + def time_float_int_str_lines(self, orient): + self.df_int_float_str.to_json(self.fname, orient='records', lines=True)
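
For a sense of what these orients produce: `orient='records'` together with `lines=True` writes one JSON object per line (the JSON Lines layout these benchmarks time), and `read_json` can stream it back in chunks via `chunksize`. A minimal round trip (illustrative only, not part of this patch; the file name is made up):

    import numpy as np
    from pandas import DataFrame, read_json

    df = DataFrame({'a': np.arange(3), 'b': np.random.randn(3)})
    df.to_json('__example__.json', orient='records', lines=True)
    # each line of the file becomes one row again on the way back in
    roundtripped = read_json('__example__.json', orient='records', lines=True)

diff --git a/asv_bench/benchmarks/io/msgpack.py b/asv_bench/benchmarks/io/msgpack.py new file mode 100644 index 0000000000000..8ccce01117ca4 --- /dev/null +++ b/asv_bench/benchmarks/io/msgpack.py @@ -0,0 +1,26 @@ +import numpy as np +from pandas import DataFrame, date_range, read_msgpack +import pandas.util.testing as tm + +from ..pandas_vb_common import BaseIO, setup # noqa + + +class MSGPack(BaseIO): + + goal_time = 0.2 + + def setup(self): + self.fname = '__test__.msg' + N = 100000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] =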
tm.makeStringIndex(N) + self.df.to_msgpack(self.fname) + + def time_read_msgpack(self): + read_msgpack(self.fname) + + def time_write_msgpack(self): + self.df.to_msgpack(self.fname) diff --git a/asv_bench/benchmarks/io/pickle.py b/asv_bench/benchmarks/io/pickle.py new file mode 100644 index 0000000000000..2ad0fcca6eb26 --- /dev/null +++ b/asv_bench/benchmarks/io/pickle.py @@ -0,0 +1,26 @@ +import numpy as np +from pandas import DataFrame, date_range, read_pickle +import pandas.util.testing as tm + +from ..pandas_vb_common import BaseIO, setup # noqa + + +class Pickle(BaseIO): + + goal_time = 0.2 + + def setup(self): + self.fname = '__test__.pkl' + N = 100000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] = tm.makeStringIndex(N) + self.df.to_pickle(self.fname) + + def time_read_pickle(self): + read_pickle(self.fname) + + def time_write_pickle(self): + self.df.to_pickle(self.fname) diff --git a/asv_bench/benchmarks/io/sas.py b/asv_bench/benchmarks/io/sas.py new file mode 100644 index 0000000000000..526c524de7fff --- /dev/null +++ b/asv_bench/benchmarks/io/sas.py @@ -0,0 +1,21 @@ +import os + +from pandas import read_sas + + +class SAS(object): + + goal_time = 0.2 + params = ['sas7bdat', 'xport'] + param_names = ['format'] + + def setup(self, format): + # Read files that are located in 'pandas/tests/io/sas/data' + files = {'sas7bdat': 'test1.sas7bdat', 'xport': 'paxraw_d_short.xpt'} + file = files[format] + paths = [os.path.dirname(__file__), '..', '..', '..', 'pandas', + 'tests', 'io', 'sas', 'data', file] + self.f = os.path.join(*paths) + + def time_read_sas(self, format): + read_sas(self.f, format=format)
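
The SQL benchmarks that follow drive the same `to_sql`/`read_sql_query` surface through both a raw `sqlite3` connection and a SQLAlchemy engine. For orientation, a minimal round trip looks roughly like this (illustrative only, not part of this patch; the table name is made up):

    import sqlite3

    import numpy as np
    from pandas import DataFrame, read_sql_query

    con = sqlite3.connect(':memory:')
    df = DataFrame({'a': np.arange(5), 'b': np.random.randn(5)})
    # if_exists='replace' drops and recreates the table on each write
    df.to_sql('example', con, if_exists='replace')
    back = read_sql_query('SELECT * FROM example', con)

diff --git a/asv_bench/benchmarks/io/sql.py b/asv_bench/benchmarks/io/sql.py new file mode 100644 index 0000000000000..ef4e501e5f3b9 --- /dev/null +++ b/asv_bench/benchmarks/io/sql.py @@ -0,0 +1,132 @@ +import sqlite3 + +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, date_range, read_sql_query, read_sql_table +from sqlalchemy import create_engine + +from ..pandas_vb_common import setup # noqa + + +class SQL(object): + + goal_time = 0.2 + params = ['sqlalchemy', 'sqlite'] + param_names = ['connection'] + + def setup(self, connection): + N = 10000 + con = {'sqlalchemy': create_engine('sqlite:///:memory:'), +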
'sqlite': sqlite3.connect(':memory:')} + self.table_name = 'test_type' + self.query_col = 'SELECT {} FROM {}'.format(dtype, self.table_name) + self.con = con[connection] + self.df = DataFrame({'float': np.random.randn(N), + 'float_with_nan': np.random.randn(N), + 'string': ['foo'] * N, + 'bool': [True] * N, + 'int': np.random.randint(0, N, size=N), + 'datetime': date_range('2000-01-01', + periods=N, + freq='s')}, + index=tm.makeStringIndex(N)) + self.df.loc[1000:3000, 'float_with_nan'] = np.nan + self.df['datetime_string'] = self.df['datetime'].astype(str) + self.df.to_sql(self.table_name, self.con, if_exists='replace') + + def time_to_sql_dataframe_column(self, connection, dtype): + self.df[[dtype]].to_sql('test1', self.con, if_exists='replace') + + def time_read_sql_query_select_column(self, connection, dtype): + read_sql_query(self.query_col, self.con) + + +class ReadSQLTable(object): + + goal_time = 0.2 + + def setup(self): + N = 10000 + self.table_name = 'test' + self.con = create_engine('sqlite:///:memory:') + self.df = DataFrame({'float': np.random.randn(N), + 'float_with_nan': np.random.randn(N), + 'string': ['foo'] * N, + 'bool': [True] * N, + 'int': np.random.randint(0, N, size=N), + 'datetime': date_range('2000-01-01', + periods=N, + freq='s')}, + index=tm.makeStringIndex(N)) + self.df.loc[1000:3000, 'float_with_nan'] = np.nan + self.df['datetime_string'] = self.df['datetime'].astype(str) + self.df.to_sql(self.table_name, self.con, if_exists='replace') + + def time_read_sql_table_all(self): + read_sql_table(self.table_name, self.con) + + def time_read_sql_table_parse_dates(self): + read_sql_table(self.table_name, self.con, columns=['datetime_string'], + parse_dates=['datetime_string']) + + +class ReadSQLTableDtypes(object): + + goal_time = 0.2 + + params = ['float', 'float_with_nan', 'string', 'bool', 'int', 'datetime'] + param_names = ['dtype'] + + def setup(self, dtype): + N = 10000 + self.table_name = 'test' + self.con = create_engine('sqlite:///:memory:') + self.df = DataFrame({'float': np.random.randn(N), + 'float_with_nan': np.random.randn(N), + 'string': ['foo'] * N, + 'bool': [True] * N, + 'int': np.random.randint(0, N, size=N), + 'datetime': date_range('2000-01-01', + periods=N, + freq='s')}, + index=tm.makeStringIndex(N)) + self.df.loc[1000:3000, 'float_with_nan'] = np.nan + self.df['datetime_string'] = self.df['datetime'].astype(str) + self.df.to_sql(self.table_name, self.con, if_exists='replace') + + def time_read_sql_table_column(self, dtype): + read_sql_table(self.table_name, self.con, columns=[dtype]) diff --git a/asv_bench/benchmarks/io/stata.py b/asv_bench/benchmarks/io/stata.py new file mode 100644 index 0000000000000..e0f5752ca930f --- /dev/null +++ b/asv_bench/benchmarks/io/stata.py @@ -0,0 +1,37 @@ +import numpy as np +from pandas import DataFrame, date_range, read_stata +import pandas.util.testing as tm + +from ..pandas_vb_common import BaseIO, setup # noqa + + +class Stata(BaseIO): + + goal_time = 0.2 + params = ['tc', 'td', 'tm', 'tw', 'th', 'tq', 'ty'] + param_names = ['convert_dates'] + + def setup(self, convert_dates): + self.fname = '__test__.dta' + N = 100000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] = tm.makeStringIndex(N) + self.df['int8_'] = np.random.randint(np.iinfo(np.int8).min, + np.iinfo(np.int8).max - 27, N) + self.df['int16_'] = np.random.randint(np.iinfo(np.int16).min, + np.iinfo(np.int16).max - 27, N) + 
self.df['int32_'] = np.random.randint(np.iinfo(np.int32).min, + np.iinfo(np.int32).max - 27, N) + self.df['float32_'] = np.array(np.random.randn(N), + dtype=np.float32) + self.convert_dates = {'index': convert_dates} + self.df.to_stata(self.fname, self.convert_dates) + + def time_read_stata(self, convert_dates): + read_stata(self.fname) + + def time_write_stata(self, convert_dates): + self.df.to_stata(self.fname, self.convert_dates) diff --git a/asv_bench/benchmarks/io_bench.py b/asv_bench/benchmarks/io_bench.py deleted file mode 100644 index 0f15ab6e5e142..0000000000000 --- a/asv_bench/benchmarks/io_bench.py +++ /dev/null @@ -1,171 +0,0 @@ -from .pandas_vb_common import * -from pandas import concat, Timestamp, compat -try: - from StringIO import StringIO -except ImportError: - from io import StringIO -import timeit - - -class frame_to_csv(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(3000, 30)) - - def time_frame_to_csv(self): - self.df.to_csv('__test__.csv') - - -class frame_to_csv2(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame({'A': range(50000), }) - self.df['B'] = (self.df.A + 1.0) - self.df['C'] = (self.df.A + 2.0) - self.df['D'] = (self.df.A + 3.0) - - def time_frame_to_csv2(self): - self.df.to_csv('__test__.csv') - - -class frame_to_csv_date_formatting(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = DataFrame(self.rng, index=self.rng) - - def time_frame_to_csv_date_formatting(self): - self.data.to_csv('__test__.csv', date_format='%Y%m%d') - - -class frame_to_csv_mixed(object): - goal_time = 0.2 - - def setup(self): - self.df_float = DataFrame(np.random.randn(5000, 5), dtype='float64', columns=self.create_cols('float')) - self.df_int = DataFrame(np.random.randn(5000, 5), dtype='int64', columns=self.create_cols('int')) - self.df_bool = DataFrame(True, index=self.df_float.index, columns=self.create_cols('bool')) - self.df_object = DataFrame('foo', index=self.df_float.index, columns=self.create_cols('object')) - self.df_dt = DataFrame(Timestamp('20010101'), index=self.df_float.index, columns=self.create_cols('date')) - self.df_float.ix[30:500, 1:3] = np.nan - self.df = concat([self.df_float, self.df_int, self.df_bool, self.df_object, self.df_dt], axis=1) - - def time_frame_to_csv_mixed(self): - self.df.to_csv('__test__.csv') - - def create_cols(self, name): - return [('%s%03d' % (name, i)) for i in range(5)] - - -class read_csv_infer_datetime_format_custom(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = '\n'.join(self.rng.map((lambda x: x.strftime('%m/%d/%Y %H:%M:%S.%f')))) - - def time_read_csv_infer_datetime_format_custom(self): - read_csv(StringIO(self.data), header=None, names=['foo'], parse_dates=['foo'], infer_datetime_format=True) - - -class read_csv_infer_datetime_format_iso8601(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = '\n'.join(self.rng.map((lambda x: x.strftime('%Y-%m-%d %H:%M:%S')))) - - def time_read_csv_infer_datetime_format_iso8601(self): - read_csv(StringIO(self.data), header=None, names=['foo'], parse_dates=['foo'], infer_datetime_format=True) - - -class read_csv_infer_datetime_format_ymd(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = '\n'.join(self.rng.map((lambda x: x.strftime('%Y%m%d')))) - - def time_read_csv_infer_datetime_format_ymd(self): - 
read_csv(StringIO(self.data), header=None, names=['foo'], parse_dates=['foo'], infer_datetime_format=True) - - -class read_csv_skiprows(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(20000) - self.df = DataFrame({'float1': randn(20000), 'float2': randn(20000), 'string1': (['foo'] * 20000), 'bool1': ([True] * 20000), 'int1': np.random.randint(0, 200000, size=20000), }, index=self.index) - self.df.to_csv('__test__.csv') - - def time_read_csv_skiprows(self): - read_csv('__test__.csv', skiprows=10000) - - -class read_csv_standard(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - self.df.to_csv('__test__.csv') - - def time_read_csv_standard(self): - read_csv('__test__.csv') - - -class read_parse_dates_iso8601(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = '\n'.join(self.rng.map((lambda x: x.strftime('%Y-%m-%d %H:%M:%S')))) - - def time_read_parse_dates_iso8601(self): - read_csv(StringIO(self.data), header=None, names=['foo'], parse_dates=['foo']) - - -class write_csv_standard(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - - def time_write_csv_standard(self): - self.df.to_csv('__test__.csv') - - -class read_csv_from_s3(object): - # Make sure that we can read part of a file from S3 without - # needing to download the entire thing. Use the timeit.default_timer - # to measure wall time instead of CPU time -- we want to see - # how long it takes to download the data. - timer = timeit.default_timer - params = ([None, "gzip", "bz2"], ["python", "c"]) - param_names = ["compression", "engine"] - - def setup(self, compression, engine): - if compression == "bz2" and engine == "c" and compat.PY2: - # The Python 2 C parser can't read bz2 from open files. - raise NotImplementedError - try: - import boto - except ImportError: - # Skip these benchmarks if `boto` is not installed. - raise NotImplementedError - - self.big_fname = "s3://pandas-test/large_random.csv" - - def time_read_nrows(self, compression, engine): - # Read a small number of rows from a huge (100,000 x 50) table. 
- ext = "" - if compression == "gzip": - ext = ".gz" - elif compression == "bz2": - ext = ".bz2" - pd.read_csv(self.big_fname + ext, nrows=10, - compression=compression, engine=engine) diff --git a/asv_bench/benchmarks/io_sql.py b/asv_bench/benchmarks/io_sql.py deleted file mode 100644 index 9a6b21f9e067a..0000000000000 --- a/asv_bench/benchmarks/io_sql.py +++ /dev/null @@ -1,215 +0,0 @@ -import sqlalchemy -from .pandas_vb_common import * -import sqlite3 -from sqlalchemy import create_engine - - -class sql_datetime_read_and_parse_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df['datetime_string'] = self.df['datetime'].map(str) - self.df.to_sql('test_type', self.engine, if_exists='replace') - self.df[['float', 'datetime_string']].to_sql('test_type', self.con, if_exists='replace') - - def time_sql_datetime_read_and_parse_sqlalchemy(self): - read_sql_table('test_type', self.engine, columns=['datetime_string'], parse_dates=['datetime_string']) - - -class sql_datetime_read_as_native_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df['datetime_string'] = self.df['datetime'].map(str) - self.df.to_sql('test_type', self.engine, if_exists='replace') - self.df[['float', 'datetime_string']].to_sql('test_type', self.con, if_exists='replace') - - def time_sql_datetime_read_as_native_sqlalchemy(self): - read_sql_table('test_type', self.engine, columns=['datetime']) - - -class sql_datetime_write_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'string': (['foo'] * 10000), 'bool': ([True] * 10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df.loc[1000:3000, 'float'] = np.nan - - def time_sql_datetime_write_sqlalchemy(self): - self.df[['datetime']].to_sql('test_datetime', self.engine, if_exists='replace') - - -class sql_float_read_query_fallback(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df['datetime_string'] = self.df['datetime'].map(str) - self.df.to_sql('test_type', self.engine, if_exists='replace') - self.df[['float', 'datetime_string']].to_sql('test_type', self.con, if_exists='replace') - - def time_sql_float_read_query_fallback(self): - read_sql_query('SELECT float FROM test_type', self.con) - - -class sql_float_read_query_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df['datetime_string'] = self.df['datetime'].map(str) - self.df.to_sql('test_type', self.engine, if_exists='replace') - self.df[['float', 'datetime_string']].to_sql('test_type', self.con, if_exists='replace') - - def time_sql_float_read_query_sqlalchemy(self): - read_sql_query('SELECT 
float FROM test_type', self.engine) - - -class sql_float_read_table_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df['datetime_string'] = self.df['datetime'].map(str) - self.df.to_sql('test_type', self.engine, if_exists='replace') - self.df[['float', 'datetime_string']].to_sql('test_type', self.con, if_exists='replace') - - def time_sql_float_read_table_sqlalchemy(self): - read_sql_table('test_type', self.engine, columns=['float']) - - -class sql_float_write_fallback(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'string': (['foo'] * 10000), 'bool': ([True] * 10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df.loc[1000:3000, 'float'] = np.nan - - def time_sql_float_write_fallback(self): - self.df[['float']].to_sql('test_float', self.con, if_exists='replace') - - -class sql_float_write_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'string': (['foo'] * 10000), 'bool': ([True] * 10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df.loc[1000:3000, 'float'] = np.nan - - def time_sql_float_write_sqlalchemy(self): - self.df[['float']].to_sql('test_float', self.engine, if_exists='replace') - - -class sql_read_query_fallback(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - self.df.to_sql('test2', self.engine, if_exists='replace') - self.df.to_sql('test2', self.con, if_exists='replace') - - def time_sql_read_query_fallback(self): - read_sql_query('SELECT * FROM test2', self.con) - - -class sql_read_query_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - self.df.to_sql('test2', self.engine, if_exists='replace') - self.df.to_sql('test2', self.con, if_exists='replace') - - def time_sql_read_query_sqlalchemy(self): - read_sql_query('SELECT * FROM test2', self.engine) - - -class sql_read_table_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - self.df.to_sql('test2', self.engine, if_exists='replace') - self.df.to_sql('test2', self.con, if_exists='replace') - - def time_sql_read_table_sqlalchemy(self): - read_sql_table('test2', 
self.engine) - - -class sql_string_write_fallback(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'string': (['foo'] * 10000), 'bool': ([True] * 10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df.loc[1000:3000, 'float'] = np.nan - - def time_sql_string_write_fallback(self): - self.df[['string']].to_sql('test_string', self.con, if_exists='replace') - - -class sql_string_write_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'string': (['foo'] * 10000), 'bool': ([True] * 10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df.loc[1000:3000, 'float'] = np.nan - - def time_sql_string_write_sqlalchemy(self): - self.df[['string']].to_sql('test_string', self.engine, if_exists='replace') - - -class sql_write_fallback(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - - def time_sql_write_fallback(self): - self.df.to_sql('test1', self.con, if_exists='replace') - - -class sql_write_sqlalchemy(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - - def time_sql_write_sqlalchemy(self): - self.df.to_sql('test1', self.engine, if_exists='replace') \ No newline at end of file diff --git a/asv_bench/benchmarks/join_merge.py b/asv_bench/benchmarks/join_merge.py index 1da0d37d4a8dd..de0a3b33da147 100644 --- a/asv_bench/benchmarks/join_merge.py +++ b/asv_bench/benchmarks/join_merge.py @@ -1,33 +1,25 @@ -from .pandas_vb_common import * +import warnings +import string +import numpy as np +import pandas.util.testing as tm +from pandas import (DataFrame, Series, MultiIndex, date_range, concat, merge, + merge_asof) +try: + from pandas import merge_ordered +except ImportError: + from pandas import ordered_merge as merge_ordered -class append_frame_single_homogenous(object): - goal_time = 0.2 - - def setup(self): - self.df1 = pd.DataFrame(np.random.randn(10000, 4), columns=['A', 'B', 'C', 'D']) - self.df2 = self.df1.copy() - self.df2.index = np.arange(10000, 20000) - self.mdf1 = self.df1.copy() - self.mdf1['obj1'] = 'bar' - self.mdf1['obj2'] = 'bar' - self.mdf1['int1'] = 5 - try: - self.mdf1.consolidate(inplace=True) - except: - pass - self.mdf2 = self.mdf1.copy() - self.mdf2.index = self.df2.index +from .pandas_vb_common import Panel, setup # noqa - def time_append_frame_single_homogenous(self): - self.df1.append(self.df2) +class Append(object): -class append_frame_single_mixed(object): goal_time = 0.2 def setup(self): - self.df1 = pd.DataFrame(np.random.randn(10000, 4), columns=['A', 'B', 'C', 'D']) + self.df1 = DataFrame(np.random.randn(10000, 4), + columns=['A', 'B', 'C', 'D']) self.df2 = self.df1.copy() self.df2.index = 
np.arange(10000, 20000) self.mdf1 = self.df1.copy() @@ -35,325 +27,336 @@ def setup(self): self.mdf1['obj2'] = 'bar' self.mdf1['int1'] = 5 try: - self.mdf1.consolidate(inplace=True) + with warnings.catch_warnings(record=True): + self.mdf1.consolidate(inplace=True) except: pass self.mdf2 = self.mdf1.copy() self.mdf2.index = self.df2.index - def time_append_frame_single_mixed(self): + def time_append_homogenous(self): + self.df1.append(self.df2) + + def time_append_mixed(self): self.mdf1.append(self.mdf2) -class concat_empty_frames1(object): +class Concat(object): + goal_time = 0.2 + params = [0, 1] + param_names = ['axis'] - def setup(self): - self.df = pd.DataFrame(dict(A=range(10000)), index=date_range('20130101', periods=10000, freq='s')) - self.empty = pd.DataFrame() + def setup(self, axis): + N = 1000 + s = Series(N, index=tm.makeStringIndex(N)) + self.series = [s[i:- i] for i in range(1, 10)] * 50 + self.small_frames = [DataFrame(np.random.randn(5, 4))] * 1000 + df = DataFrame({'A': range(N)}, + index=date_range('20130101', periods=N, freq='s')) + self.empty_left = [DataFrame(), df] + self.empty_right = [df, DataFrame()] - def time_concat_empty_frames1(self): - concat([self.df, self.empty]) + def time_concat_series(self, axis): + concat(self.series, axis=axis) + def time_concat_small_frames(self, axis): + concat(self.small_frames, axis=axis) -class concat_empty_frames2(object): - goal_time = 0.2 + def time_concat_empty_right(self, axis): + concat(self.empty_right, axis=axis) - def setup(self): - self.df = pd.DataFrame(dict(A=range(10000)), index=date_range('20130101', periods=10000, freq='s')) - self.empty = pd.DataFrame() + def time_concat_empty_left(self, axis): + concat(self.empty_left, axis=axis) - def time_concat_empty_frames2(self): - concat([self.empty, self.df]) +class ConcatPanels(object): -class concat_series_axis1(object): goal_time = 0.2 + params = ([0, 1, 2], [True, False]) + param_names = ['axis', 'ignore_index'] - def setup(self): - self.n = 1000 - self.indices = tm.makeStringIndex(1000) - self.s = Series(self.n, index=self.indices) - self.pieces = [self.s[i:(- i)] for i in range(1, 10)] - self.pieces = (self.pieces * 50) + def setup(self, axis, ignore_index): + with warnings.catch_warnings(record=True): + panel_c = Panel(np.zeros((10000, 200, 2), + dtype=np.float32, + order='C')) + self.panels_c = [panel_c] * 20 + panel_f = Panel(np.zeros((10000, 200, 2), + dtype=np.float32, + order='F')) + self.panels_f = [panel_f] * 20 - def time_concat_series_axis1(self): - concat(self.pieces, axis=1) + def time_c_ordered(self, axis, ignore_index): + with warnings.catch_warnings(record=True): + concat(self.panels_c, axis=axis, ignore_index=ignore_index) + def time_f_ordered(self, axis, ignore_index): + with warnings.catch_warnings(record=True): + concat(self.panels_f, axis=axis, ignore_index=ignore_index) -class concat_small_frames(object): - goal_time = 0.2 - def setup(self): - self.df = pd.DataFrame(randn(5, 4)) +class ConcatDataFrames(object): - def time_concat_small_frames(self): - concat(([self.df] * 1000)) + goal_time = 0.2 + params = ([0, 1], [True, False]) + param_names = ['axis', 'ignore_index'] + def setup(self, axis, ignore_index): + frame_c = DataFrame(np.zeros((10000, 200), + dtype=np.float32, order='C')) + self.frame_c = [frame_c] * 20 + frame_f = DataFrame(np.zeros((10000, 200), + dtype=np.float32, order='F')) + self.frame_f = [frame_f] * 20 -class i8merge(object): - goal_time = 0.2 + def time_c_ordered(self, axis, ignore_index): + concat(self.frame_c, axis=axis, 
ignore_index=ignore_index) - def setup(self): - (low, high, n) = (((-1) << 10), (1 << 10), (1 << 20)) - self.left = pd.DataFrame(np.random.randint(low, high, (n, 7)), columns=list('ABCDEFG')) - self.left['left'] = self.left.sum(axis=1) - self.i = np.random.permutation(len(self.left)) - self.right = self.left.iloc[self.i].copy() - self.right.columns = (self.right.columns[:(-1)].tolist() + ['right']) - self.right.index = np.arange(len(self.right)) - self.right['right'] *= (-1) + def time_f_ordered(self, axis, ignore_index): + concat(self.frame_f, axis=axis, ignore_index=ignore_index) - def time_i8merge(self): - merge(self.left, self.right, how='outer') +class Join(object): -class join_dataframe_index_multi(object): goal_time = 0.2 + params = [True, False] + param_names = ['sort'] - def setup(self): - self.level1 = tm.makeStringIndex(10).values - self.level2 = tm.makeStringIndex(1000).values - self.label1 = np.arange(10).repeat(1000) - self.label2 = np.tile(np.arange(1000), 10) - self.key1 = np.tile(self.level1.take(self.label1), 10) - self.key2 = np.tile(self.level2.take(self.label2), 10) - self.shuf = np.arange(100000) - random.shuffle(self.shuf) - try: - self.index2 = MultiIndex(levels=[self.level1, self.level2], labels=[self.label1, self.label2]) - self.index3 = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - self.df_multi = DataFrame(np.random.randn(len(self.index2), 4), index=self.index2, columns=['A', 'B', 'C', 'D']) - except: - pass - try: - self.DataFrame = DataMatrix - except: - pass - self.df = pd.DataFrame({'data1': np.random.randn(100000), 'data2': np.random.randn(100000), 'key1': self.key1, 'key2': self.key2, }) - self.df_key1 = pd.DataFrame(np.random.randn(len(self.level1), 4), index=self.level1, columns=['A', 'B', 'C', 'D']) - self.df_key2 = pd.DataFrame(np.random.randn(len(self.level2), 4), index=self.level2, columns=['A', 'B', 'C', 'D']) - self.df_shuf = self.df.reindex(self.df.index[self.shuf]) + def setup(self, sort): + level1 = tm.makeStringIndex(10).values + level2 = tm.makeStringIndex(1000).values + label1 = np.arange(10).repeat(1000) + label2 = np.tile(np.arange(1000), 10) + index2 = MultiIndex(levels=[level1, level2], + labels=[label1, label2]) + self.df_multi = DataFrame(np.random.randn(len(index2), 4), + index=index2, + columns=['A', 'B', 'C', 'D']) - def time_join_dataframe_index_multi(self): - self.df.join(self.df_multi, on=['key1', 'key2']) + self.key1 = np.tile(level1.take(label1), 10) + self.key2 = np.tile(level2.take(label2), 10) + self.df = DataFrame({'data1': np.random.randn(100000), + 'data2': np.random.randn(100000), + 'key1': self.key1, + 'key2': self.key2}) + self.df_key1 = DataFrame(np.random.randn(len(level1), 4), + index=level1, + columns=['A', 'B', 'C', 'D']) + self.df_key2 = DataFrame(np.random.randn(len(level2), 4), + index=level2, + columns=['A', 'B', 'C', 'D']) -class join_dataframe_index_single_key_bigger(object): - goal_time = 0.2 + shuf = np.arange(100000) + np.random.shuffle(shuf) + self.df_shuf = self.df.reindex(self.df.index[shuf]) - def setup(self): - self.level1 = tm.makeStringIndex(10).values - self.level2 = tm.makeStringIndex(1000).values - self.label1 = np.arange(10).repeat(1000) - self.label2 = np.tile(np.arange(1000), 10) - self.key1 = np.tile(self.level1.take(self.label1), 10) - self.key2 = np.tile(self.level2.take(self.label2), 10) - self.shuf = np.arange(100000) - random.shuffle(self.shuf) 
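(The rewritten classes above lean on asv's parameterized-benchmark protocol: `params` lists the argument values, `param_names` labels them, and asv calls `setup` and every `time_*` method once per combination. A minimal sketch of that calling convention, assuming asv's documented behavior; the `ExampleBench` class and the driver loop below are illustrative only, not part of asv or of this patch:

import itertools

class ExampleBench(object):
    # asv reads these class attributes to build the parameter grid
    params = ([0, 1], [True, False])
    param_names = ['axis', 'ignore_index']

    def setup(self, axis, ignore_index):
        self.data = list(range(1000))

    def time_example(self, axis, ignore_index):
        sorted(self.data, reverse=ignore_index)

# Illustrative driver: asv itself iterates the cartesian product of params,
# calling setup() before each timed method with the same argument tuple.
for combo in itertools.product(*ExampleBench.params):
    bench = ExampleBench()
    bench.setup(*combo)
    bench.time_example(*combo)

Each combination then shows up as a separate result in the asv report, so one class covers what previously required a separate `*_sort`/`*_nosort` class per variant.)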
- try: - self.index2 = MultiIndex(levels=[self.level1, self.level2], labels=[self.label1, self.label2]) - self.index3 = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - self.df_multi = DataFrame(np.random.randn(len(self.index2), 4), index=self.index2, columns=['A', 'B', 'C', 'D']) - except: - pass - try: - self.DataFrame = DataMatrix - except: - pass - self.df = pd.DataFrame({'data1': np.random.randn(100000), 'data2': np.random.randn(100000), 'key1': self.key1, 'key2': self.key2, }) - self.df_key1 = pd.DataFrame(np.random.randn(len(self.level1), 4), index=self.level1, columns=['A', 'B', 'C', 'D']) - self.df_key2 = pd.DataFrame(np.random.randn(len(self.level2), 4), index=self.level2, columns=['A', 'B', 'C', 'D']) - self.df_shuf = self.df.reindex(self.df.index[self.shuf]) + def time_join_dataframe_index_multi(self, sort): + self.df.join(self.df_multi, on=['key1', 'key2'], sort=sort) + + def time_join_dataframe_index_single_key_bigger(self, sort): + self.df.join(self.df_key2, on='key2', sort=sort) - def time_join_dataframe_index_single_key_bigger(self): - self.df.join(self.df_key2, on='key2') + def time_join_dataframe_index_single_key_small(self, sort): + self.df.join(self.df_key1, on='key1', sort=sort) + def time_join_dataframe_index_shuffle_key_bigger_sort(self, sort): + self.df_shuf.join(self.df_key2, on='key2', sort=sort) + + +class JoinIndex(object): -class join_dataframe_index_single_key_bigger_sort(object): goal_time = 0.2 def setup(self): - self.level1 = tm.makeStringIndex(10).values - self.level2 = tm.makeStringIndex(1000).values - self.label1 = np.arange(10).repeat(1000) - self.label2 = np.tile(np.arange(1000), 10) - self.key1 = np.tile(self.level1.take(self.label1), 10) - self.key2 = np.tile(self.level2.take(self.label2), 10) - self.shuf = np.arange(100000) - random.shuffle(self.shuf) - try: - self.index2 = MultiIndex(levels=[self.level1, self.level2], labels=[self.label1, self.label2]) - self.index3 = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - self.df_multi = DataFrame(np.random.randn(len(self.index2), 4), index=self.index2, columns=['A', 'B', 'C', 'D']) - except: - pass - try: - self.DataFrame = DataMatrix - except: - pass - self.df = pd.DataFrame({'data1': np.random.randn(100000), 'data2': np.random.randn(100000), 'key1': self.key1, 'key2': self.key2, }) - self.df_key1 = pd.DataFrame(np.random.randn(len(self.level1), 4), index=self.level1, columns=['A', 'B', 'C', 'D']) - self.df_key2 = pd.DataFrame(np.random.randn(len(self.level2), 4), index=self.level2, columns=['A', 'B', 'C', 'D']) - self.df_shuf = self.df.reindex(self.df.index[self.shuf]) + N = 50000 + self.left = DataFrame(np.random.randint(1, N / 500, (N, 2)), + columns=['jim', 'joe']) + self.right = DataFrame(np.random.randint(1, N / 500, (N, 2)), + columns=['jolie', 'jolia']).set_index('jolie') - def time_join_dataframe_index_single_key_bigger_sort(self): - self.df_shuf.join(self.df_key2, on='key2', sort=True) + def time_left_outer_join_index(self): + self.left.join(self.right, on='jim') -class join_dataframe_index_single_key_small(object): +class JoinNonUnique(object): + # outer join of non-unique + # GH 6329 goal_time = 0.2 def setup(self): - self.level1 = tm.makeStringIndex(10).values - self.level2 = tm.makeStringIndex(1000).values - 
self.label1 = np.arange(10).repeat(1000) - self.label2 = np.tile(np.arange(1000), 10) - self.key1 = np.tile(self.level1.take(self.label1), 10) - self.key2 = np.tile(self.level2.take(self.label2), 10) - self.shuf = np.arange(100000) - random.shuffle(self.shuf) - try: - self.index2 = MultiIndex(levels=[self.level1, self.level2], labels=[self.label1, self.label2]) - self.index3 = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - self.df_multi = DataFrame(np.random.randn(len(self.index2), 4), index=self.index2, columns=['A', 'B', 'C', 'D']) - except: - pass - try: - self.DataFrame = DataMatrix - except: - pass - self.df = pd.DataFrame({'data1': np.random.randn(100000), 'data2': np.random.randn(100000), 'key1': self.key1, 'key2': self.key2, }) - self.df_key1 = pd.DataFrame(np.random.randn(len(self.level1), 4), index=self.level1, columns=['A', 'B', 'C', 'D']) - self.df_key2 = pd.DataFrame(np.random.randn(len(self.level2), 4), index=self.level2, columns=['A', 'B', 'C', 'D']) - self.df_shuf = self.df.reindex(self.df.index[self.shuf]) + date_index = date_range('01-Jan-2013', '23-Jan-2013', freq='T') + daily_dates = date_index.to_period('D').to_timestamp('S', 'S') + self.fracofday = date_index.values - daily_dates.values + self.fracofday = self.fracofday.astype('timedelta64[ns]') + self.fracofday = self.fracofday.astype(np.float64) / 86400000000000.0 + self.fracofday = Series(self.fracofday, daily_dates) + index = date_range(date_index.min(), date_index.max(), freq='D') + self.temp = Series(1.0, index)[self.fracofday.index] - def time_join_dataframe_index_single_key_small(self): - self.df.join(self.df_key1, on='key1') + def time_join_non_unique_equal(self): + self.fracofday * self.temp -class join_dataframe_integer_2key(object): - goal_time = 0.2 +class Merge(object): - def setup(self): - self.df = pd.DataFrame({'key1': np.tile(np.arange(500).repeat(10), 2), 'key2': np.tile(np.arange(250).repeat(10), 4), 'value': np.random.randn(10000), }) - self.df2 = pd.DataFrame({'key1': np.arange(500), 'value2': randn(500), }) + goal_time = 0.2 + params = [True, False] + param_names = ['sort'] + + def setup(self, sort): + N = 10000 + indices = tm.makeStringIndex(N).values + indices2 = tm.makeStringIndex(N).values + key = np.tile(indices[:8000], 10) + key2 = np.tile(indices2[:8000], 10) + self.left = DataFrame({'key': key, 'key2': key2, + 'value': np.random.randn(80000)}) + self.right = DataFrame({'key': indices[2000:], + 'key2': indices2[2000:], + 'value2': np.random.randn(8000)}) + + self.df = DataFrame({'key1': np.tile(np.arange(500).repeat(10), 2), + 'key2': np.tile(np.arange(250).repeat(10), 4), + 'value': np.random.randn(10000)}) + self.df2 = DataFrame({'key1': np.arange(500), + 'value2': np.random.randn(500)}) self.df3 = self.df[:5000] - def time_join_dataframe_integer_2key(self): - merge(self.df, self.df3) + def time_merge_2intkey(self, sort): + merge(self.left, self.right, sort=sort) + + def time_merge_dataframe_integer_2key(self, sort): + merge(self.df, self.df3, sort=sort) + + def time_merge_dataframe_integer_key(self, sort): + merge(self.df, self.df2, on='key1', sort=sort) -class join_dataframe_integer_key(object): +class I8Merge(object): + goal_time = 0.2 + params = ['inner', 'outer', 'left', 'right'] + param_names = ['how'] - def setup(self): - self.df = pd.DataFrame({'key1': np.tile(np.arange(500).repeat(10), 2), 'key2': np.tile(np.arange(250).repeat(10), 4), 
'value': np.random.randn(10000), }) - self.df2 = pd.DataFrame({'key1': np.arange(500), 'value2': randn(500), }) - self.df3 = self.df[:5000] + def setup(self, how): + low, high, n = -1000, 1000, 10**6 + self.left = DataFrame(np.random.randint(low, high, (n, 7)), + columns=list('ABCDEFG')) + self.left['left'] = self.left.sum(axis=1) + self.right = self.left.sample(frac=1).rename({'left': 'right'}, axis=1) + self.right = self.right.reset_index(drop=True) + self.right['right'] *= -1 + + def time_i8merge(self, how): + merge(self.left, self.right, how=how) - def time_join_dataframe_integer_key(self): - merge(self.df, self.df2, on='key1') +class MergeCategoricals(object): -class join_non_unique_equal(object): goal_time = 0.2 def setup(self): - self.date_index = date_range('01-Jan-2013', '23-Jan-2013', freq='T') - self.daily_dates = self.date_index.to_period('D').to_timestamp('S', 'S') - self.fracofday = (self.date_index.view(np.ndarray) - self.daily_dates.view(np.ndarray)) - self.fracofday = (self.fracofday.astype('timedelta64[ns]').astype(np.float64) / 86400000000000.0) - self.fracofday = TimeSeries(self.fracofday, self.daily_dates) - self.index = date_range(self.date_index.min().to_period('A').to_timestamp('D', 'S'), self.date_index.max().to_period('A').to_timestamp('D', 'E'), freq='D') - self.temp = TimeSeries(1.0, self.index) + self.left_object = DataFrame( + {'X': np.random.choice(range(0, 10), size=(10000,)), + 'Y': np.random.choice(['one', 'two', 'three'], size=(10000,))}) - def time_join_non_unique_equal(self): - (self.fracofday * self.temp[self.fracofday.index]) + self.right_object = DataFrame( + {'X': np.random.choice(range(0, 10), size=(10000,)), + 'Z': np.random.choice(['jjj', 'kkk', 'sss'], size=(10000,))}) + self.left_cat = self.left_object.assign( + Y=self.left_object['Y'].astype('category')) + self.right_cat = self.right_object.assign( + Z=self.right_object['Z'].astype('category')) + + def time_merge_object(self): + merge(self.left_object, self.right_object, on='X') + + def time_merge_cat(self): + merge(self.left_cat, self.right_cat, on='X') -class left_outer_join_index(object): - goal_time = 0.2 + +class MergeOrdered(object): def setup(self): - np.random.seed(2718281) - self.n = 50000 - self.left = pd.DataFrame(np.random.randint(1, (self.n / 500), (self.n, 2)), columns=['jim', 'joe']) - self.right = pd.DataFrame(np.random.randint(1, (self.n / 500), (self.n, 2)), columns=['jolie', 'jolia']).set_index('jolie') + groups = tm.makeStringIndex(10).values + self.left = DataFrame({'group': groups.repeat(5000), + 'key': np.tile(np.arange(0, 10000, 2), 10), + 'lvalue': np.random.randn(50000)}) + self.right = DataFrame({'key': np.arange(10000), + 'rvalue': np.random.randn(10000)}) - def time_left_outer_join_index(self): - self.left.join(self.right, on='jim') + def time_merge_ordered(self): + merge_ordered(self.left, self.right, on='key', left_by='group') -class merge_2intkey_nosort(object): - goal_time = 0.2 +class MergeAsof(object): def setup(self): - self.N = 10000 - self.indices = tm.makeStringIndex(self.N).values - self.indices2 = tm.makeStringIndex(self.N).values - self.key = np.tile(self.indices[:8000], 10) - self.key2 = np.tile(self.indices2[:8000], 10) - self.left = pd.DataFrame({'key': self.key, 'key2': self.key2, 'value': np.random.randn(80000), }) - self.right = pd.DataFrame({'key': self.indices[2000:], 'key2': self.indices2[2000:], 'value2': np.random.randn(8000), }) + one_count = 200000 + two_count = 1000000 - def time_merge_2intkey_nosort(self): - merge(self.left, self.right, 
sort=False) + df1 = DataFrame( + {'time': np.random.randint(0, one_count / 20, one_count), + 'key': np.random.choice(list(string.ascii_uppercase), one_count), + 'key2': np.random.randint(0, 25, one_count), + 'value1': np.random.randn(one_count)}) + df2 = DataFrame( + {'time': np.random.randint(0, two_count / 20, two_count), + 'key': np.random.choice(list(string.ascii_uppercase), two_count), + 'key2': np.random.randint(0, 25, two_count), + 'value2': np.random.randn(two_count)}) + df1 = df1.sort_values('time') + df2 = df2.sort_values('time') -class merge_2intkey_sort(object): - goal_time = 0.2 + df1['time32'] = np.int32(df1.time) + df2['time32'] = np.int32(df2.time) - def setup(self): - self.N = 10000 - self.indices = tm.makeStringIndex(self.N).values - self.indices2 = tm.makeStringIndex(self.N).values - self.key = np.tile(self.indices[:8000], 10) - self.key2 = np.tile(self.indices2[:8000], 10) - self.left = pd.DataFrame({'key': self.key, 'key2': self.key2, 'value': np.random.randn(80000), }) - self.right = pd.DataFrame({'key': self.indices[2000:], 'key2': self.indices2[2000:], 'value2': np.random.randn(8000), }) + self.df1a = df1[['time', 'value1']] + self.df2a = df2[['time', 'value2']] + self.df1b = df1[['time', 'key', 'value1']] + self.df2b = df2[['time', 'key', 'value2']] + self.df1c = df1[['time', 'key2', 'value1']] + self.df2c = df2[['time', 'key2', 'value2']] + self.df1d = df1[['time32', 'value1']] + self.df2d = df2[['time32', 'value2']] + self.df1e = df1[['time', 'key', 'key2', 'value1']] + self.df2e = df2[['time', 'key', 'key2', 'value2']] - def time_merge_2intkey_sort(self): - merge(self.left, self.right, sort=True) + def time_on_int(self): + merge_asof(self.df1a, self.df2a, on='time') + def time_on_int32(self): + merge_asof(self.df1d, self.df2d, on='time32') -class series_align_int64_index(object): - goal_time = 0.2 + def time_by_object(self): + merge_asof(self.df1b, self.df2b, on='time', by='key') - def setup(self): - self.n = 1000000 - self.sz = 500000 - self.rng = np.arange(0, 10000000000000, 10000000) - self.stamps = (np.datetime64(datetime.now()).view('i8') + self.rng) - self.idx1 = np.sort(self.sample(self.stamps, self.sz)) - self.idx2 = np.sort(self.sample(self.stamps, self.sz)) - self.ts1 = Series(np.random.randn(self.sz), self.idx1) - self.ts2 = Series(np.random.randn(self.sz), self.idx2) + def time_by_int(self): + merge_asof(self.df1c, self.df2c, on='time', by='key2') - def time_series_align_int64_index(self): - (self.ts1 + self.ts2) + def time_multiby(self): + merge_asof(self.df1e, self.df2e, on='time', by=['key', 'key2']) - def sample(self, values, k): - self.sampler = np.random.permutation(len(values)) - return values.take(self.sampler[:k]) +class Align(object): -class series_align_left_monotonic(object): goal_time = 0.2 def setup(self): - self.n = 1000000 - self.sz = 500000 - self.rng = np.arange(0, 10000000000000, 10000000) - self.stamps = (np.datetime64(datetime.now()).view('i8') + self.rng) - self.idx1 = np.sort(self.sample(self.stamps, self.sz)) - self.idx2 = np.sort(self.sample(self.stamps, self.sz)) - self.ts1 = Series(np.random.randn(self.sz), self.idx1) - self.ts2 = Series(np.random.randn(self.sz), self.idx2) + size = 5 * 10**5 + rng = np.arange(0, 10**13, 10**7) + stamps = np.datetime64('now').view('i8') + rng + idx1 = np.sort(np.random.choice(stamps, size, replace=False)) + idx2 = np.sort(np.random.choice(stamps, size, replace=False)) + self.ts1 = Series(np.random.randn(size), idx1) + self.ts2 = Series(np.random.randn(size), idx2) + + def 
time_series_align_int64_index(self): + self.ts1 + self.ts2 def time_series_align_left_monotonic(self): self.ts1.align(self.ts2, join='left') - - def sample(self, values, k): - self.sampler = np.random.permutation(len(values)) - return values.take(self.sampler[:k]) \ No newline at end of file diff --git a/asv_bench/benchmarks/miscellaneous.py b/asv_bench/benchmarks/miscellaneous.py deleted file mode 100644 index fe610ef4cb376..0000000000000 --- a/asv_bench/benchmarks/miscellaneous.py +++ /dev/null @@ -1,30 +0,0 @@ -from .pandas_vb_common import * -from pandas.util.decorators import cache_readonly - - -class match_strings(object): - goal_time = 0.2 - - def setup(self): - self.uniques = tm.makeStringIndex(1000).values - self.all = self.uniques.repeat(10) - - def time_match_strings(self): - match(self.all, self.uniques) - - -class misc_cache_readonly(object): - goal_time = 0.2 - - def setup(self): - - - class Foo: - - @cache_readonly - def prop(self): - return 5 - self.obj = Foo() - - def time_misc_cache_readonly(self): - self.obj.prop \ No newline at end of file diff --git a/asv_bench/benchmarks/multiindex_object.py b/asv_bench/benchmarks/multiindex_object.py new file mode 100644 index 0000000000000..0c92214795557 --- /dev/null +++ b/asv_bench/benchmarks/multiindex_object.py @@ -0,0 +1,140 @@ +import string + +import numpy as np +import pandas.util.testing as tm +from pandas import date_range, MultiIndex + +from .pandas_vb_common import setup # noqa + + +class GetLoc(object): + + goal_time = 0.2 + + def setup(self): + self.mi_large = MultiIndex.from_product( + [np.arange(1000), np.arange(20), list(string.ascii_letters)], + names=['one', 'two', 'three']) + self.mi_med = MultiIndex.from_product( + [np.arange(1000), np.arange(10), list('A')], + names=['one', 'two', 'three']) + self.mi_small = MultiIndex.from_product( + [np.arange(100), list('A'), list('A')], + names=['one', 'two', 'three']) + + def time_large_get_loc(self): + self.mi_large.get_loc((999, 19, 'Z')) + + def time_large_get_loc_warm(self): + for _ in range(1000): + self.mi_large.get_loc((999, 19, 'Z')) + + def time_med_get_loc(self): + self.mi_med.get_loc((999, 9, 'A')) + + def time_med_get_loc_warm(self): + for _ in range(1000): + self.mi_med.get_loc((999, 9, 'A')) + + def time_string_get_loc(self): + self.mi_small.get_loc((99, 'A', 'A')) + + def time_small_get_loc_warm(self): + for _ in range(1000): + self.mi_small.get_loc((99, 'A', 'A')) + + +class Duplicates(object): + + goal_time = 0.2 + + def setup(self): + size = 65536 + arrays = [np.random.randint(0, 8192, size), + np.random.randint(0, 1024, size)] + mask = np.random.rand(size) < 0.1 + self.mi_unused_levels = MultiIndex.from_arrays(arrays) + self.mi_unused_levels = self.mi_unused_levels[mask] + + def time_remove_unused_levels(self): + self.mi_unused_levels.remove_unused_levels() + + +class Integer(object): + + goal_time = 0.2 + + def setup(self): + self.mi_int = MultiIndex.from_product([np.arange(1000), + np.arange(1000)], + names=['one', 'two']) + self.obj_index = np.array([(0, 10), (0, 11), (0, 12), + (0, 13), (0, 14), (0, 15), + (0, 16), (0, 17), (0, 18), + (0, 19)], dtype=object) + + def time_get_indexer(self): + self.mi_int.get_indexer(self.obj_index) + + def time_is_monotonic(self): + self.mi_int.is_monotonic + + +class Duplicated(object): + + goal_time = 0.2 + + def setup(self): + n, k = 200, 5000 + levels = [np.arange(n), + tm.makeStringIndex(n).values, + 1000 + np.arange(n)] + labels = [np.random.choice(n, (k * n)) for lev in levels] + self.mi = 
MultiIndex(levels=levels, labels=labels) + + def time_duplicated(self): + self.mi.duplicated() + + +class Sortlevel(object): + + goal_time = 0.2 + + def setup(self): + n = 1182720 + low, high = -4096, 4096 + arrs = [np.repeat(np.random.randint(low, high, (n // k)), k) + for k in [11, 7, 5, 3, 1]] + self.mi_int = MultiIndex.from_arrays(arrs)[np.random.permutation(n)] + + a = np.repeat(np.arange(100), 1000) + b = np.tile(np.arange(1000), 100) + self.mi = MultiIndex.from_arrays([a, b]) + self.mi = self.mi.take(np.random.permutation(np.arange(100000))) + + def time_sortlevel_int64(self): + self.mi_int.sortlevel() + + def time_sortlevel_zero(self): + self.mi.sortlevel(0) + + def time_sortlevel_one(self): + self.mi.sortlevel(1) + + +class Values(object): + + goal_time = 0.2 + + def setup_cache(self): + + level1 = range(1000) + level2 = date_range(start='1/1/2012', periods=100) + mi = MultiIndex.from_product([level1, level2]) + return mi + + def time_datetime_level_values_copy(self, mi): + mi.copy().values + + def time_datetime_level_values_sliced(self, mi): + mi[:10].values diff --git a/asv_bench/benchmarks/offset.py b/asv_bench/benchmarks/offset.py new file mode 100644 index 0000000000000..e161b887ee86f --- /dev/null +++ b/asv_bench/benchmarks/offset.py @@ -0,0 +1,124 @@ +# -*- coding: utf-8 -*- +import warnings +from datetime import datetime + +import numpy as np +import pandas as pd +try: + import pandas.tseries.holiday # noqa +except ImportError: + pass + +hcal = pd.tseries.holiday.USFederalHolidayCalendar() +# These offsets currently raise a NotImplementedError with .apply_index() +non_apply = [pd.offsets.Day(), + pd.offsets.BYearEnd(), + pd.offsets.BYearBegin(), + pd.offsets.BQuarterEnd(), + pd.offsets.BQuarterBegin(), + pd.offsets.BMonthEnd(), + pd.offsets.BMonthBegin(), + pd.offsets.CustomBusinessDay(), + pd.offsets.CustomBusinessDay(calendar=hcal), + pd.offsets.CustomBusinessMonthBegin(calendar=hcal), + pd.offsets.CustomBusinessMonthEnd(calendar=hcal)] +other_offsets = [pd.offsets.YearEnd(), pd.offsets.YearBegin(), + pd.offsets.QuarterEnd(), pd.offsets.QuarterBegin(), + pd.offsets.MonthEnd(), pd.offsets.MonthBegin(), + pd.offsets.DateOffset(months=2, days=2), + pd.offsets.BusinessDay(), pd.offsets.SemiMonthEnd(), + pd.offsets.SemiMonthBegin()] +offsets = non_apply + other_offsets + + +class ApplyIndex(object): + + goal_time = 0.2 + + params = other_offsets + param_names = ['offset'] + + def setup(self, offset): + N = 10000 + self.rng = pd.date_range(start='1/1/2000', periods=N, freq='T') + + def time_apply_index(self, offset): + offset.apply_index(self.rng) + + +class OnOffset(object): + + goal_time = 0.2 + + params = offsets + param_names = ['offset'] + + def setup(self, offset): + self.dates = [datetime(2016, m, d) + for m in [10, 11, 12] + for d in [1, 2, 3, 28, 29, 30, 31] + if not (m == 11 and d == 31)] + + def time_on_offset(self, offset): + for date in self.dates: + offset.onOffset(date) + + +class OffsetSeriesArithmetic(object): + + goal_time = 0.2 + params = offsets + param_names = ['offset'] + + def setup(self, offset): + N = 1000 + rng = pd.date_range(start='1/1/2000', periods=N, freq='T') + self.data = pd.Series(rng) + + def time_add_offset(self, offset): + with warnings.catch_warnings(record=True): + self.data + offset + + +class OffsetDatetimeIndexArithmetic(object): + + goal_time = 0.2 + params = offsets + param_names = ['offset'] + + def setup(self, offset): + N = 1000 + self.data = pd.date_range(start='1/1/2000', 
periods=N, freq='T') + + def time_add_offset(self, offset): + with warnings.catch_warnings(record=True): + self.data + offset + + +class OffsetDatetimeArithmetic(object): + + goal_time = 0.2 + params = offsets + param_names = ['offset'] + + def setup(self, offset): + self.date = datetime(2011, 1, 1) + self.dt64 = np.datetime64('2011-01-01 09:00Z') + + def time_apply(self, offset): + offset.apply(self.date) + + def time_apply_np_dt64(self, offset): + offset.apply(self.dt64) + + def time_add(self, offset): + self.date + offset + + def time_add_10(self, offset): + self.date + (10 * offset) + + def time_subtract(self, offset): + self.date - offset + + def time_subtract_10(self, offset): + self.date - (10 * offset) diff --git a/asv_bench/benchmarks/packers.py b/asv_bench/benchmarks/packers.py deleted file mode 100644 index 12e48295d8d05..0000000000000 --- a/asv_bench/benchmarks/packers.py +++ /dev/null @@ -1,857 +0,0 @@ -from .pandas_vb_common import * -from numpy.random import randint -import pandas as pd -from collections import OrderedDict -from pandas.compat import BytesIO -import sqlite3 -import os -from sqlalchemy import create_engine -import numpy as np -from random import randrange -from pandas.core import common as com - - -class packers_read_csv(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df.to_csv(self.f) - - def time_packers_read_csv(self): - pd.read_csv(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_excel(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.bio = BytesIO() - self.writer = pd.io.excel.ExcelWriter(self.bio, engine='xlsxwriter') - self.df[:2000].to_excel(self.writer) - self.writer.save() - - def time_packers_read_excel(self): - self.bio.seek(0) - pd.read_excel(self.bio) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_hdf_store(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - 
self.remove(self.f) - self.df2.to_hdf(self.f, 'df') - - def time_packers_read_hdf_store(self): - pd.read_hdf(self.f, 'df') - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_hdf_table(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df2.to_hdf(self.f, 'df', format='table') - - def time_packers_read_hdf_table(self): - pd.read_hdf(self.f, 'df') - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_json(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df.to_json(self.f, orient='split') - self.df.index = np.arange(self.N) - - def time_packers_read_json(self): - pd.read_json(self.f, orient='split') - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_json_date_index(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df.to_json(self.f, orient='split') - - def time_packers_read_json_date_index(self): - pd.read_json(self.f, orient='split') - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_pack(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df2.to_msgpack(self.f) - - def time_packers_read_pack(self): - pd.read_msgpack(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_pickle(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - 
self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df2.to_pickle(self.f) - - def time_packers_read_pickle(self): - pd.read_pickle(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_sql(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.engine = create_engine('sqlite:///:memory:') - self.df2.to_sql('table', self.engine, if_exists='replace') - - def time_packers_read_sql(self): - pd.read_sql_table('table', self.engine) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_stata(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df.to_stata(self.f, {'index': 'tc', }) - - def time_packers_read_stata(self): - pd.read_stata(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_read_stata_with_validation(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df['int8_'] = [randint(np.iinfo(np.int8).min, (np.iinfo(np.int8).max - 27)) for _ in range(self.N)] - self.df['int16_'] = [randint(np.iinfo(np.int16).min, (np.iinfo(np.int16).max - 27)) for _ in range(self.N)] - self.df['int32_'] = [randint(np.iinfo(np.int32).min, (np.iinfo(np.int32).max - 27)) for _ in range(self.N)] - self.df['float32_'] = np.array(randn(self.N), dtype=np.float32) - self.df.to_stata(self.f, {'index': 'tc', }) - - def time_packers_read_stata_with_validation(self): - pd.read_stata(self.f) - - def remove(self, f): - try: - os.remove(self.f) - 
except: - pass - - -class packers_write_csv(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - - def time_packers_write_csv(self): - self.df.to_csv(self.f) - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_excel_openpyxl(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.bio = BytesIO() - - def time_packers_write_excel_openpyxl(self): - self.bio.seek(0) - self.writer = pd.io.excel.ExcelWriter(self.bio, engine='openpyxl') - self.df[:2000].to_excel(self.writer) - self.writer.save() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_excel_xlsxwriter(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.bio = BytesIO() - - def time_packers_write_excel_xlsxwriter(self): - self.bio.seek(0) - self.writer = pd.io.excel.ExcelWriter(self.bio, engine='xlsxwriter') - self.df[:2000].to_excel(self.writer) - self.writer.save() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_excel_xlwt(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.bio = BytesIO() - - def time_packers_write_excel_xlwt(self): - self.bio.seek(0) - self.writer = pd.io.excel.ExcelWriter(self.bio, engine='xlwt') - self.df[:2000].to_excel(self.writer) - self.writer.save() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - 
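(Every one of these deleted packers classes repeats the same `remove`/`teardown` boilerplate around a scratch file; the `BaseIO` helper added to `pandas_vb_common.py` later in this diff factors that out. A minimal sketch of how a rewritten IO benchmark could subclass it, assuming the `BaseIO` definition shown below in this patch; the `ToCSV` class name and its `fname` value are hypothetical examples, not code from this patch:

import numpy as np
from pandas import DataFrame

from .pandas_vb_common import BaseIO, setup  # noqa


class ToCSV(BaseIO):
    # BaseIO.teardown() removes self.fname after each timed run,
    # so the subclass only declares the scratch file and the workload.
    goal_time = 0.2
    fname = '__test__.csv'

    def setup(self):
        self.df = DataFrame(np.random.randn(10000, 5))

    def time_write_csv(self):
        self.df.to_csv(self.fname)
)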
-class packers_write_hdf_store(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - - def time_packers_write_hdf_store(self): - self.df2.to_hdf(self.f, 'df') - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_hdf_table(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - - def time_packers_write_hdf_table(self): - self.df2.to_hdf(self.f, 'df', table=True) - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_json(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df.index = np.arange(self.N) - - def time_packers_write_json(self): - self.df.to_json(self.f, orient='split') - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_json_T(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df.index = np.arange(self.N) - - def time_packers_write_json_T(self): - self.df.to_json(self.f, orient='columns') - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_json_date_index(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - 
self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - - def time_packers_write_json_date_index(self): - self.df.to_json(self.f, orient='split') - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_json_mixed_delta_int_tstamp(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.cols = [(lambda i: ('{0}_timedelta'.format(i), [pd.Timedelta(('%d seconds' % randrange(1000000.0))) for _ in range(self.N)])), (lambda i: ('{0}_int'.format(i), randint(100000000.0, size=self.N))), (lambda i: ('{0}_timestamp'.format(i), [pd.Timestamp((1418842918083256000 + randrange(1000000000.0, 1e+18, 200))) for _ in range(self.N)]))] - self.df_mixed = DataFrame(OrderedDict([self.cols[(i % len(self.cols))](i) for i in range(self.C)]), index=self.index) - - def time_packers_write_json_mixed_delta_int_tstamp(self): - self.df_mixed.to_json(self.f, orient='split') - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_json_mixed_float_int(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.cols = [(lambda i: ('{0}_float'.format(i), randn(self.N))), (lambda i: ('{0}_int'.format(i), randint(100000000.0, size=self.N)))] - self.df_mixed = DataFrame(OrderedDict([self.cols[(i % len(self.cols))](i) for i in range(self.C)]), index=self.index) - - def time_packers_write_json_mixed_float_int(self): - self.df_mixed.to_json(self.f, orient='index') - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_json_mixed_float_int_T(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for 
i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.cols = [(lambda i: ('{0}_float'.format(i), randn(self.N))), (lambda i: ('{0}_int'.format(i), randint(100000000.0, size=self.N)))] - self.df_mixed = DataFrame(OrderedDict([self.cols[(i % len(self.cols))](i) for i in range(self.C)]), index=self.index) - - def time_packers_write_json_mixed_float_int_T(self): - self.df_mixed.to_json(self.f, orient='columns') - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_json_mixed_float_int_str(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.cols = [(lambda i: ('{0}_float'.format(i), randn(self.N))), (lambda i: ('{0}_int'.format(i), randint(100000000.0, size=self.N))), (lambda i: ('{0}_str'.format(i), [('%08x' % randrange((16 ** 8))) for _ in range(self.N)]))] - self.df_mixed = DataFrame(OrderedDict([self.cols[(i % len(self.cols))](i) for i in range(self.C)]), index=self.index) - - def time_packers_write_json_mixed_float_int_str(self): - self.df_mixed.to_json(self.f, orient='split') - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_pack(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - - def time_packers_write_pack(self): - self.df2.to_msgpack(self.f) - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_pickle(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - - def time_packers_write_pickle(self): - self.df2.to_pickle(self.f) - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_sql(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 
100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.engine = create_engine('sqlite:///:memory:') - - def time_packers_write_sql(self): - self.df2.to_sql('table', self.engine, if_exists='replace') - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_stata(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df.to_stata(self.f, {'index': 'tc', }) - - def time_packers_write_stata(self): - self.df.to_stata(self.f, {'index': 'tc', }) - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - -class packers_write_stata_with_validation(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df2 = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - self.df['int8_'] = [randint(np.iinfo(np.int8).min, (np.iinfo(np.int8).max - 27)) for _ in range(self.N)] - self.df['int16_'] = [randint(np.iinfo(np.int16).min, (np.iinfo(np.int16).max - 27)) for _ in range(self.N)] - self.df['int32_'] = [randint(np.iinfo(np.int32).min, (np.iinfo(np.int32).max - 27)) for _ in range(self.N)] - self.df['float32_'] = np.array(randn(self.N), dtype=np.float32) - self.df.to_stata(self.f, {'index': 'tc', }) - - def time_packers_write_stata_with_validation(self): - self.df.to_stata(self.f, {'index': 'tc', }) - - def teardown(self): - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass \ No newline at end of file diff --git a/asv_bench/benchmarks/pandas_vb_common.py b/asv_bench/benchmarks/pandas_vb_common.py index 3370131929c22..e255cd94f265b 100644 --- a/asv_bench/benchmarks/pandas_vb_common.py +++ b/asv_bench/benchmarks/pandas_vb_common.py @@ -1,31 +1,43 @@ -from pandas import * -import pandas as pd -from datetime import timedelta -from numpy.random import randn -from numpy.random import randint -from numpy.random import permutation -import pandas.util.testing as tm -import random +import os +from importlib import import_module + import numpy as np -import threading -try: - from pandas.compat import range -except ImportError: - pass - 
-np.random.seed(1234) -try: - import pandas._tseries as lib -except: - import pandas.lib as lib - -try: - Panel = WidePanel -except Exception: - pass - -# didn't add to namespace until later -try: - from pandas.core.index import MultiIndex -except ImportError: - pass +from pandas import Panel + +# Compatibility import for lib +for imp in ['pandas._libs.lib', 'pandas.lib']: + try: + lib = import_module(imp) + break + except: + pass + +numeric_dtypes = [np.int64, np.int32, np.uint32, np.uint64, np.float32, + np.float64, np.int16, np.int8, np.uint16, np.uint8] +datetime_dtypes = [np.datetime64, np.timedelta64] + + +def setup(*args, **kwargs): + # This function just needs to be imported into each benchmark file to + # set up the random seed before each function. + # http://asv.readthedocs.io/en/latest/writing_benchmarks.html + np.random.seed(1234) + + +class BaseIO(object): + """ + Base class for IO benchmarks + """ + fname = None + + def remove(self, f): + """Remove created files""" + try: + os.remove(f) + except: + # On Windows, attempting to remove a file that is in use + # causes an exception to be raised + pass + + def teardown(self, *args, **kwargs): + self.remove(self.fname) diff --git a/asv_bench/benchmarks/panel_ctor.py b/asv_bench/benchmarks/panel_ctor.py index 0b0e73847aa96..ce946c76ed199 100644 --- a/asv_bench/benchmarks/panel_ctor.py +++ b/asv_bench/benchmarks/panel_ctor.py @@ -1,64 +1,60 @@ -from .pandas_vb_common import * +import warnings +from datetime import datetime, timedelta +from pandas import DataFrame, DatetimeIndex, date_range -class panel_from_dict_all_different_indexes(object): - goal_time = 0.2 - - def setup(self): - self.data_frames = {} - self.start = datetime(1990, 1, 1) - self.end = datetime(2012, 1, 1) - for x in range(100): - self.end += timedelta(days=1) - self.dr = np.asarray(date_range(self.start, self.end)) - self.df = DataFrame({'a': ([0] * len(self.dr)), 'b': ([1] * len(self.dr)), 'c': ([2] * len(self.dr)), }, index=self.dr) - self.data_frames[x] = self.df - - def time_panel_from_dict_all_different_indexes(self): - Panel.from_dict(self.data_frames) +from .pandas_vb_common import Panel, setup # noqa -class panel_from_dict_equiv_indexes(object): +class DifferentIndexes(object): goal_time = 0.2 def setup(self): self.data_frames = {} + start = datetime(1990, 1, 1) + end = datetime(2012, 1, 1) for x in range(100): - self.dr = np.asarray(DatetimeIndex(start=datetime(1990, 1, 1), end=datetime(2012, 1, 1), freq=datetools.Day(1))) - self.df = DataFrame({'a': ([0] * len(self.dr)), 'b': ([1] * len(self.dr)), 'c': ([2] * len(self.dr)), }, index=self.dr) - self.data_frames[x] = self.df + end += timedelta(days=1) + idx = date_range(start, end) + df = DataFrame({'a': 0, 'b': 1, 'c': 2}, index=idx) + self.data_frames[x] = df - def time_panel_from_dict_equiv_indexes(self): - Panel.from_dict(self.data_frames) + def time_from_dict(self): + with warnings.catch_warnings(record=True): + Panel.from_dict(self.data_frames) -class panel_from_dict_same_index(object): +class SameIndexes(object): + goal_time = 0.2 def setup(self): - self.dr = np.asarray(DatetimeIndex(start=datetime(1990, 1, 1), end=datetime(2012, 1, 1), freq=datetools.Day(1))) - self.data_frames = {} - for x in range(100): - self.df = DataFrame({'a': ([0] * len(self.dr)), 'b': ([1] * len(self.dr)), 'c': ([2] * len(self.dr)), }, index=self.dr) - self.data_frames[x] = self.df + idx = DatetimeIndex(start=datetime(1990, 1, 1), + end=datetime(2012, 1, 1), + freq='D') + df = DataFrame({'a': 0, 'b': 1, 'c': 2}, index=idx) + 
self.data_frames = dict(enumerate([df] * 100)) - def time_panel_from_dict_same_index(self): - Panel.from_dict(self.data_frames) + def time_from_dict(self): + with warnings.catch_warnings(record=True): + Panel.from_dict(self.data_frames) -class panel_from_dict_two_different_indexes(object): +class TwoIndexes(object): + goal_time = 0.2 def setup(self): - self.data_frames = {} - self.start = datetime(1990, 1, 1) - self.end = datetime(2012, 1, 1) - for x in range(100): - if (x == 50): - self.end += timedelta(days=1) - self.dr = np.asarray(date_range(self.start, self.end)) - self.df = DataFrame({'a': ([0] * len(self.dr)), 'b': ([1] * len(self.dr)), 'c': ([2] * len(self.dr)), }, index=self.dr) - self.data_frames[x] = self.df - - def time_panel_from_dict_two_different_indexes(self): - Panel.from_dict(self.data_frames) \ No newline at end of file + start = datetime(1990, 1, 1) + end = datetime(2012, 1, 1) + df1 = DataFrame({'a': 0, 'b': 1, 'c': 2}, + index=DatetimeIndex(start=start, end=end, freq='D')) + end += timedelta(days=1) + df2 = DataFrame({'a': 0, 'b': 1, 'c': 2}, + index=DatetimeIndex(start=start, end=end, freq='D')) + dfs = [df1] * 50 + [df2] * 50 + self.data_frames = dict(enumerate(dfs)) + + def time_from_dict(self): + with warnings.catch_warnings(record=True): + Panel.from_dict(self.data_frames) diff --git a/asv_bench/benchmarks/panel_methods.py b/asv_bench/benchmarks/panel_methods.py index 90118eaf6e407..a5b1a92e9cf67 100644 --- a/asv_bench/benchmarks/panel_methods.py +++ b/asv_bench/benchmarks/panel_methods.py @@ -1,56 +1,24 @@ -from .pandas_vb_common import * +import warnings +import numpy as np -class panel_pct_change_items(object): - goal_time = 0.2 - - def setup(self): - self.index = date_range(start='2000', freq='D', periods=1000) - self.panel = Panel(np.random.randn(100, len(self.index), 1000)) - - def time_panel_pct_change_items(self): - self.panel.pct_change(1, axis='items') - - -class panel_pct_change_major(object): - goal_time = 0.2 - - def setup(self): - self.index = date_range(start='2000', freq='D', periods=1000) - self.panel = Panel(np.random.randn(100, len(self.index), 1000)) - - def time_panel_pct_change_major(self): - self.panel.pct_change(1, axis='major') +from .pandas_vb_common import Panel, setup # noqa -class panel_pct_change_minor(object): - goal_time = 0.2 - - def setup(self): - self.index = date_range(start='2000', freq='D', periods=1000) - self.panel = Panel(np.random.randn(100, len(self.index), 1000)) - - def time_panel_pct_change_minor(self): - self.panel.pct_change(1, axis='minor') - +class PanelMethods(object): -class panel_shift(object): goal_time = 0.2 + params = ['items', 'major', 'minor'] + param_names = ['axis'] - def setup(self): - self.index = date_range(start='2000', freq='D', periods=1000) - self.panel = Panel(np.random.randn(100, len(self.index), 1000)) - - def time_panel_shift(self): - self.panel.shift(1) - - -class panel_shift_minor(object): - goal_time = 0.2 + def setup(self, axis): + with warnings.catch_warnings(record=True): + self.panel = Panel(np.random.randn(100, 1000, 100)) - def setup(self): - self.index = date_range(start='2000', freq='D', periods=1000) - self.panel = Panel(np.random.randn(100, len(self.index), 1000)) + def time_pct_change(self, axis): + with warnings.catch_warnings(record=True): + self.panel.pct_change(1, axis=axis) - def time_panel_shift_minor(self): - self.panel.shift(1, axis='minor') \ No newline at end of file + def time_shift(self, axis): + with warnings.catch_warnings(record=True): + self.panel.shift(1, 
axis=axis) diff --git a/asv_bench/benchmarks/parser_vb.py b/asv_bench/benchmarks/parser_vb.py deleted file mode 100644 index 18cd4de6cc9c5..0000000000000 --- a/asv_bench/benchmarks/parser_vb.py +++ /dev/null @@ -1,112 +0,0 @@ -from .pandas_vb_common import * -import os -from pandas import read_csv, read_table -try: - from cStringIO import StringIO -except ImportError: - from io import StringIO - - -class read_csv_comment2(object): - goal_time = 0.2 - - def setup(self): - self.data = ['A,B,C'] - self.data = (self.data + (['1,2,3 # comment'] * 100000)) - self.data = '\n'.join(self.data) - - def time_read_csv_comment2(self): - read_csv(StringIO(self.data), comment='#') - - -class read_csv_default_converter(object): - goal_time = 0.2 - - def setup(self): - self.data = '0.1213700904466425978256438611,0.0525708283766902484401839501,0.4174092731488769913994474336\n 0.4096341697147408700274695547,0.1587830198973579909349496119,0.1292545832485494372576795285\n 0.8323255650024565799327547210,0.9694902427379478160318626578,0.6295047811546814475747169126\n 0.4679375305798131323697930383,0.2963942381834381301075609371,0.5268936082160610157032465394\n 0.6685382761849776311890991564,0.6721207066140679753374342908,0.6519975277021627935170045020\n ' - self.data = (self.data * 200) - - def time_read_csv_default_converter(self): - read_csv(StringIO(self.data), sep=',', header=None, float_precision=None) - - -class read_csv_precise_converter(object): - goal_time = 0.2 - - def setup(self): - self.data = '0.1213700904466425978256438611,0.0525708283766902484401839501,0.4174092731488769913994474336\n 0.4096341697147408700274695547,0.1587830198973579909349496119,0.1292545832485494372576795285\n 0.8323255650024565799327547210,0.9694902427379478160318626578,0.6295047811546814475747169126\n 0.4679375305798131323697930383,0.2963942381834381301075609371,0.5268936082160610157032465394\n 0.6685382761849776311890991564,0.6721207066140679753374342908,0.6519975277021627935170045020\n ' - self.data = (self.data * 200) - - def time_read_csv_precise_converter(self): - read_csv(StringIO(self.data), sep=',', header=None, float_precision='high') - - -class read_csv_roundtrip_converter(object): - goal_time = 0.2 - - def setup(self): - self.data = '0.1213700904466425978256438611,0.0525708283766902484401839501,0.4174092731488769913994474336\n 0.4096341697147408700274695547,0.1587830198973579909349496119,0.1292545832485494372576795285\n 0.8323255650024565799327547210,0.9694902427379478160318626578,0.6295047811546814475747169126\n 0.4679375305798131323697930383,0.2963942381834381301075609371,0.5268936082160610157032465394\n 0.6685382761849776311890991564,0.6721207066140679753374342908,0.6519975277021627935170045020\n ' - self.data = (self.data * 200) - - def time_read_csv_roundtrip_converter(self): - read_csv(StringIO(self.data), sep=',', header=None, float_precision='round_trip') - - -class read_csv_thou_vb(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 8 - self.format = (lambda x: '{:,}'.format(x)) - self.df = DataFrame((np.random.randn(self.N, self.K) * np.random.randint(100, 10000, (self.N, self.K)))) - self.df = self.df.applymap(self.format) - self.df.to_csv('test.csv', sep='|') - - def time_read_csv_thou_vb(self): - read_csv('test.csv', sep='|', thousands=',') - - def teardown(self): - os.remove('test.csv') - - -class read_csv_vb(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 8 - self.df = DataFrame((np.random.randn(self.N, self.K) * np.random.randint(100, 10000, (self.N, 
self.K)))) - self.df.to_csv('test.csv', sep='|') - - def time_read_csv_vb(self): - read_csv('test.csv', sep='|') - - def teardown(self): - os.remove('test.csv') - - -class read_table_multiple_date(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 8 - self.data = 'KORD,19990127, 19:00:00, 18:56:00, 0.8100, 2.8100, 7.2000, 0.0000, 280.0000\n KORD,19990127, 20:00:00, 19:56:00, 0.0100, 2.2100, 7.2000, 0.0000, 260.0000\n KORD,19990127, 21:00:00, 20:56:00, -0.5900, 2.2100, 5.7000, 0.0000, 280.0000\n KORD,19990127, 21:00:00, 21:18:00, -0.9900, 2.0100, 3.6000, 0.0000, 270.0000\n KORD,19990127, 22:00:00, 21:56:00, -0.5900, 1.7100, 5.1000, 0.0000, 290.0000\n ' - self.data = (self.data * 200) - - def time_read_table_multiple_date(self): - read_table(StringIO(self.data), sep=',', header=None, parse_dates=[[1, 2], [1, 3]]) - - -class read_table_multiple_date_baseline(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 8 - self.data = 'KORD,19990127 19:00:00, 18:56:00, 0.8100, 2.8100, 7.2000, 0.0000, 280.0000\n KORD,19990127 20:00:00, 19:56:00, 0.0100, 2.2100, 7.2000, 0.0000, 260.0000\n KORD,19990127 21:00:00, 20:56:00, -0.5900, 2.2100, 5.7000, 0.0000, 280.0000\n KORD,19990127 21:00:00, 21:18:00, -0.9900, 2.0100, 3.6000, 0.0000, 270.0000\n KORD,19990127 22:00:00, 21:56:00, -0.5900, 1.7100, 5.1000, 0.0000, 290.0000\n ' - self.data = (self.data * 200) - - def time_read_table_multiple_date_baseline(self): - read_table(StringIO(self.data), sep=',', header=None, parse_dates=[1]) \ No newline at end of file diff --git a/asv_bench/benchmarks/period.py b/asv_bench/benchmarks/period.py new file mode 100644 index 0000000000000..c34f9a737473e --- /dev/null +++ b/asv_bench/benchmarks/period.py @@ -0,0 +1,121 @@ +from pandas import (DataFrame, Series, Period, PeriodIndex, date_range, + period_range) + + +class PeriodProperties(object): + + params = (['M', 'min'], + ['year', 'month', 'day', 'hour', 'minute', 'second', + 'is_leap_year', 'quarter', 'qyear', 'week', 'daysinmonth', + 'dayofweek', 'dayofyear', 'start_time', 'end_time']) + param_names = ['freq', 'attr'] + + def setup(self, freq, attr): + self.per = Period('2012-06-01', freq=freq) + + def time_property(self, freq, attr): + getattr(self.per, attr) + + +class PeriodUnaryMethods(object): + + params = ['M', 'min'] + param_names = ['freq'] + + def setup(self, freq): + self.per = Period('2012-06-01', freq=freq) + + def time_to_timestamp(self, freq): + self.per.to_timestamp() + + def time_now(self, freq): + self.per.now(freq) + + def time_asfreq(self, freq): + self.per.asfreq('A') + + +class PeriodIndexConstructor(object): + + goal_time = 0.2 + + params = ['D'] + param_names = ['freq'] + + def setup(self, freq): + self.rng = date_range('1985', periods=1000) + self.rng2 = date_range('1985', periods=1000).to_pydatetime() + + def time_from_date_range(self, freq): + PeriodIndex(self.rng, freq=freq) + + def time_from_pydatetime(self, freq): + PeriodIndex(self.rng2, freq=freq) + + +class DataFramePeriodColumn(object): + + goal_time = 0.2 + + def setup(self): + self.rng = period_range(start='1/1/1990', freq='S', periods=20000) + self.df = DataFrame(index=range(len(self.rng))) + + def time_setitem_period_column(self): + self.df['col'] = self.rng + + def time_set_index(self): + # GH#21582 limited by comparisons of Period objects + self.df['col2'] = self.rng + self.df.set_index('col2', append=True) + + +class Algorithms(object): + + goal_time = 0.2 + + params = ['index', 'series'] + param_names = ['typ'] + + def setup(self, 
typ): + data = [Period('2011-01', freq='M'), Period('2011-02', freq='M'), + Period('2011-03', freq='M'), Period('2011-04', freq='M')] + + if typ == 'index': + self.vector = PeriodIndex(data * 1000, freq='M') + elif typ == 'series': + self.vector = Series(data * 1000) + + def time_drop_duplicates(self, typ): + self.vector.drop_duplicates() + + def time_value_counts(self, typ): + self.vector.value_counts() + + +class Indexing(object): + + goal_time = 0.2 + + def setup(self): + self.index = PeriodIndex(start='1985', periods=1000, freq='D') + self.series = Series(range(1000), index=self.index) + self.period = self.index[500] + + def time_get_loc(self): + self.index.get_loc(self.period) + + def time_shape(self): + self.index.shape + + def time_shallow_copy(self): + self.index._shallow_copy() + + def time_series_loc(self): + self.series.loc[self.period] + + def time_align(self): + DataFrame({'a': self.series, 'b': self.series[:500]}) + + def time_intersection(self): + self.index[:750].intersection(self.index[250:]) diff --git a/asv_bench/benchmarks/plotting.py b/asv_bench/benchmarks/plotting.py index f46082ac6f288..5b49112b0e07d 100644 --- a/asv_bench/benchmarks/plotting.py +++ b/asv_bench/benchmarks/plotting.py @@ -1,19 +1,64 @@ -from .pandas_vb_common import * +import numpy as np +from pandas import DataFrame, Series, DatetimeIndex, date_range try: - from pandas import date_range + from pandas.plotting import andrews_curves except ImportError: + from pandas.tools.plotting import andrews_curves +import matplotlib +matplotlib.use('Agg') - def date_range(start=None, end=None, periods=None, freq=None): - return DatetimeIndex(start, end, periods=periods, offset=freq) +from .pandas_vb_common import setup # noqa -class plot_timeseries_period(object): +class Plotting(object): + + goal_time = 0.2 + + def setup(self): + self.s = Series(np.random.randn(1000000)) + self.df = DataFrame({'col': self.s}) + + def time_series_plot(self): + self.s.plot() + + def time_frame_plot(self): + self.df.plot() + + +class TimeseriesPlotting(object): + goal_time = 0.2 def setup(self): - self.N = 2000 - self.M = 5 - self.df = DataFrame(np.random.randn(self.N, self.M), index=date_range('1/1/1975', periods=self.N)) + N = 2000 + M = 5 + idx = date_range('1/1/1975', periods=N) + self.df = DataFrame(np.random.randn(N, M), index=idx) + + idx_irregular = DatetimeIndex(np.concatenate((idx.values[0:10], + idx.values[12:]))) + self.df2 = DataFrame(np.random.randn(len(idx_irregular), M), + index=idx_irregular) + + def time_plot_regular(self): + self.df.plot() + + def time_plot_regular_compat(self): + self.df.plot(x_compat=True) + + def time_plot_irregular(self): + self.df2.plot() + + +class Misc(object): + + goal_time = 0.6 + + def setup(self): + N = 500 + M = 10 + self.df = DataFrame(np.random.randn(N, M)) + self.df['Name'] = ["A"] * N - def time_plot_timeseries_period(self): - self.df.plot() \ No newline at end of file + def time_plot_andrews_curves(self): + andrews_curves(self.df, "Name") diff --git a/asv_bench/benchmarks/reindex.py b/asv_bench/benchmarks/reindex.py index b1c039058ff8f..413427a16f40b 100644 --- a/asv_bench/benchmarks/reindex.py +++ b/asv_bench/benchmarks/reindex.py @@ -1,397 +1,172 @@ -from .pandas_vb_common import * -from random import shuffle +import numpy as np +import pandas.util.testing as tm +from pandas import (DataFrame, Series, DatetimeIndex, MultiIndex, Index, + date_range) +from .pandas_vb_common import setup, lib # noqa -class dataframe_reindex(object): - goal_time = 0.2 - - def setup(self): - self.rng 
= DatetimeIndex(start='1/1/1970', periods=10000, freq=datetools.Minute()) - self.df = DataFrame(np.random.rand(10000, 10), index=self.rng, columns=range(10)) - self.df['foo'] = 'bar' - self.rng2 = Index(self.rng[::2]) - - def time_dataframe_reindex(self): - self.df.reindex(self.rng2) - - -class frame_drop_dup_inplace(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, 'value': np.random.randn((self.N * self.K)), }) - self.col_array_list = list(self.df.values.T) - - def time_frame_drop_dup_inplace(self): - self.df.drop_duplicates(['key1', 'key2'], inplace=True) - - -class frame_drop_dup_na_inplace(object): - goal_time = 0.2 +class Reindex(object): - def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, 'value': np.random.randn((self.N * self.K)), }) - self.col_array_list = list(self.df.values.T) - self.df.ix[:10000, :] = np.nan - - def time_frame_drop_dup_na_inplace(self): - self.df.drop_duplicates(['key1', 'key2'], inplace=True) - - -class frame_drop_duplicates(object): goal_time = 0.2 def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, 'value': np.random.randn((self.N * self.K)), }) - self.col_array_list = list(self.df.values.T) - - def time_frame_drop_duplicates(self): - self.df.drop_duplicates(['key1', 'key2']) - - -class frame_drop_duplicates_int(object): - - def setup(self): - np.random.seed(1234) - self.N = 1000000 - self.K = 10000 - self.key1 = np.random.randint(0,self.K,size=self.N) - self.df = DataFrame({'key1': self.key1}) - - def time_frame_drop_duplicates_int(self): - self.df.drop_duplicates() - - -class frame_drop_duplicates_na(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, 'value': np.random.randn((self.N * self.K)), }) - self.col_array_list = list(self.df.values.T) - self.df.ix[:10000, :] = np.nan - - def time_frame_drop_duplicates_na(self): - self.df.drop_duplicates(['key1', 'key2']) - - -class frame_fillna_many_columns_pad(object): - goal_time = 0.2 - - def setup(self): - self.values = np.random.randn(1000, 1000) - self.values[::2] = np.nan - self.df = DataFrame(self.values) - - def time_frame_fillna_many_columns_pad(self): - self.df.fillna(method='pad') - - -class frame_reindex_columns(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(index=range(10000), data=np.random.rand(10000, 30), columns=range(30)) - - def time_frame_reindex_columns(self): - self.df.reindex(columns=self.df.columns[1:5]) - - -class frame_sort_index_by_columns(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, 'value': np.random.randn((self.N * self.K)), }) - self.col_array_list = 
list(self.df.values.T) - - def time_frame_sort_index_by_columns(self): - self.df.sort_index(by=['key1', 'key2']) - - -class lib_fast_zip(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, 'value': np.random.randn((self.N * self.K)), }) - self.col_array_list = list(self.df.values.T) - - def time_lib_fast_zip(self): - lib.fast_zip(self.col_array_list) - - -class lib_fast_zip_fillna(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, 'value': np.random.randn((self.N * self.K)), }) - self.col_array_list = list(self.df.values.T) - self.df.ix[:10000, :] = np.nan - - def time_lib_fast_zip_fillna(self): - lib.fast_zip_fillna(self.col_array_list) - - -class reindex_daterange_backfill(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=100000, freq=datetools.Minute()) - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) - self.ts2 = self.ts[::2] - self.ts3 = self.ts2.reindex(self.ts.index) - self.ts4 = self.ts3.astype('float32') - - def time_reindex_daterange_backfill(self): - self.backfill(self.ts2, self.ts.index) - - def pad(self, source_series, target_index): - try: - source_series.reindex(target_index, method='pad') - except: - source_series.reindex(target_index, fillMethod='pad') - - def backfill(self, source_series, target_index): - try: - source_series.reindex(target_index, method='backfill') - except: - source_series.reindex(target_index, fillMethod='backfill') - - -class reindex_daterange_pad(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=100000, freq=datetools.Minute()) - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) - self.ts2 = self.ts[::2] - self.ts3 = self.ts2.reindex(self.ts.index) - self.ts4 = self.ts3.astype('float32') - - def time_reindex_daterange_pad(self): - self.pad(self.ts2, self.ts.index) - - def pad(self, source_series, target_index): - try: - source_series.reindex(target_index, method='pad') - except: - source_series.reindex(target_index, fillMethod='pad') - - def backfill(self, source_series, target_index): - try: - source_series.reindex(target_index, method='backfill') - except: - source_series.reindex(target_index, fillMethod='backfill') - - -class reindex_fillna_backfill(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=100000, freq=datetools.Minute()) - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) - self.ts2 = self.ts[::2] - self.ts3 = self.ts2.reindex(self.ts.index) - self.ts4 = self.ts3.astype('float32') - - def time_reindex_fillna_backfill(self): - self.ts3.fillna(method='backfill') + rng = DatetimeIndex(start='1/1/1970', periods=10000, freq='1min') + self.df = DataFrame(np.random.rand(10000, 10), index=rng, + columns=range(10)) + self.df['foo'] = 'bar' + self.rng_subset = Index(rng[::2]) + self.df2 = DataFrame(index=range(10000), + data=np.random.rand(10000, 30), columns=range(30)) + N = 5000 + K = 200 + level1 = tm.makeStringIndex(N).values.repeat(K) + level2 = np.tile(tm.makeStringIndex(K).values, N) + index = MultiIndex.from_arrays([level1, level2]) + self.s = 
Series(np.random.randn(N * K), index=index) + self.s_subset = self.s[::2] + + def time_reindex_dates(self): + self.df.reindex(self.rng_subset) + + def time_reindex_columns(self): + self.df2.reindex(columns=self.df.columns[1:5]) - def pad(self, source_series, target_index): - try: - source_series.reindex(target_index, method='pad') - except: - source_series.reindex(target_index, fillMethod='pad') + def time_reindex_multiindex(self): + self.s.reindex(self.s_subset.index) - def backfill(self, source_series, target_index): - try: - source_series.reindex(target_index, method='backfill') - except: - source_series.reindex(target_index, fillMethod='backfill') +class ReindexMethod(object): -class reindex_fillna_backfill_float32(object): goal_time = 0.2 + params = ['pad', 'backfill'] + param_names = ['method'] - def setup(self): - self.rng = date_range('1/1/2000', periods=100000, freq=datetools.Minute()) - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) - self.ts2 = self.ts[::2] - self.ts3 = self.ts2.reindex(self.ts.index) - self.ts4 = self.ts3.astype('float32') - - def time_reindex_fillna_backfill_float32(self): - self.ts4.fillna(method='backfill') + def setup(self, method): + N = 100000 + self.idx = date_range('1/1/2000', periods=N, freq='1min') + self.ts = Series(np.random.randn(N), index=self.idx)[::2] - def pad(self, source_series, target_index): - try: - source_series.reindex(target_index, method='pad') - except: - source_series.reindex(target_index, fillMethod='pad') + def time_reindex_method(self, method): + self.ts.reindex(self.idx, method=method) - def backfill(self, source_series, target_index): - try: - source_series.reindex(target_index, method='backfill') - except: - source_series.reindex(target_index, fillMethod='backfill') +class Fillna(object): -class reindex_fillna_pad(object): goal_time = 0.2 + params = ['pad', 'backfill'] + param_names = ['method'] - def setup(self): - self.rng = date_range('1/1/2000', periods=100000, freq=datetools.Minute()) - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) - self.ts2 = self.ts[::2] - self.ts3 = self.ts2.reindex(self.ts.index) - self.ts4 = self.ts3.astype('float32') + def setup(self, method): + N = 100000 + self.idx = date_range('1/1/2000', periods=N, freq='1min') + ts = Series(np.random.randn(N), index=self.idx)[::2] + self.ts_reindexed = ts.reindex(self.idx) + self.ts_float32 = self.ts_reindexed.astype('float32') - def time_reindex_fillna_pad(self): - self.ts3.fillna(method='pad') + def time_reindexed(self, method): + self.ts_reindexed.fillna(method=method) - def pad(self, source_series, target_index): - try: - source_series.reindex(target_index, method='pad') - except: - source_series.reindex(target_index, fillMethod='pad') + def time_float_32(self, method): + self.ts_float32.fillna(method=method) - def backfill(self, source_series, target_index): - try: - source_series.reindex(target_index, method='backfill') - except: - source_series.reindex(target_index, fillMethod='backfill') +class LevelAlign(object): -class reindex_fillna_pad_float32(object): goal_time = 0.2 def setup(self): - self.rng = date_range('1/1/2000', periods=100000, freq=datetools.Minute()) - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) - self.ts2 = self.ts[::2] - self.ts3 = self.ts2.reindex(self.ts.index) - self.ts4 = self.ts3.astype('float32') + self.index = MultiIndex( + levels=[np.arange(10), np.arange(100), np.arange(100)], + labels=[np.arange(10).repeat(10000), + np.tile(np.arange(100).repeat(100), 10), + 
np.tile(np.tile(np.arange(100), 100), 10)]) + self.df = DataFrame(np.random.randn(len(self.index), 4), + index=self.index) + self.df_level = DataFrame(np.random.randn(100, 4), + index=self.index.levels[1]) - def time_reindex_fillna_pad_float32(self): - self.ts4.fillna(method='pad') + def time_align_level(self): + self.df.align(self.df_level, level=1, copy=False) - def pad(self, source_series, target_index): - try: - source_series.reindex(target_index, method='pad') - except: - source_series.reindex(target_index, fillMethod='pad') + def time_reindex_level(self): + self.df_level.reindex(self.index, level=1) - def backfill(self, source_series, target_index): - try: - source_series.reindex(target_index, method='backfill') - except: - source_series.reindex(target_index, fillMethod='backfill') +class DropDuplicates(object): -class reindex_frame_level_align(object): goal_time = 0.2 + params = [True, False] + param_names = ['inplace'] - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) + def setup(self, inplace): + N = 10000 + K = 10 + key1 = tm.makeStringIndex(N).values.repeat(K) + key2 = tm.makeStringIndex(N).values.repeat(K) + self.df = DataFrame({'key1': key1, 'key2': key2, + 'value': np.random.randn(N * K)}) + self.df_nan = self.df.copy() + self.df_nan.iloc[:10000, :] = np.nan - def time_reindex_frame_level_align(self): - self.df.align(self.df_level, level=1, copy=False) + self.s = Series(np.random.randint(0, 1000, size=10000)) + self.s_str = Series(np.tile(tm.makeStringIndex(1000).values, 10)) + N = 1000000 + K = 10000 + key1 = np.random.randint(0, K, size=N) + self.df_int = DataFrame({'key1': key1}) + self.df_bool = DataFrame(np.random.randint(0, 2, size=(K, 10), + dtype=bool)) -class reindex_frame_level_reindex(object): - goal_time = 0.2 + def time_frame_drop_dups(self, inplace): + self.df.drop_duplicates(['key1', 'key2'], inplace=inplace) - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) + def time_frame_drop_dups_na(self, inplace): + self.df_nan.drop_duplicates(['key1', 'key2'], inplace=inplace) - def time_reindex_frame_level_reindex(self): - self.df_level.reindex(self.df.index, level=1) + def time_series_drop_dups_int(self, inplace): + self.s.drop_duplicates(inplace=inplace) + def time_series_drop_dups_string(self, inplace): + self.s_str.drop_duplicates(inplace=inplace) -class reindex_multiindex(object): - goal_time = 0.2 + def time_frame_drop_dups_int(self, inplace): + self.df_int.drop_duplicates(inplace=inplace) - def setup(self): - self.N = 1000 - self.K = 20 - self.level1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.level2 = np.tile(tm.makeStringIndex(self.K).values, self.N) - self.index = MultiIndex.from_arrays([self.level1, self.level2]) - self.s1 = Series(np.random.randn((self.N * self.K)), index=self.index) - self.s2 = self.s1[::2] - - def 
time_reindex_multiindex(self): - self.s1.reindex(self.s2.index) + def time_frame_drop_dups_bool(self, inplace): + self.df_bool.drop_duplicates(inplace=inplace) -class series_align_irregular_string(object): +class Align(object): + # blog "pandas escaped the zoo" goal_time = 0.2 def setup(self): - self.n = 50000 - self.indices = tm.makeStringIndex(self.n) - self.subsample_size = 40000 - self.x = Series(np.random.randn(50000), self.indices) - self.y = Series(np.random.randn(self.subsample_size), index=self.sample(self.indices, self.subsample_size)) + n = 50000 + indices = tm.makeStringIndex(n) + subsample_size = 40000 + self.x = Series(np.random.randn(n), indices) + self.y = Series(np.random.randn(subsample_size), + index=np.random.choice(indices, subsample_size, + replace=False)) - def time_series_align_irregular_string(self): - (self.x + self.y) + def time_align_series_irregular_string(self): + self.x + self.y - def sample(self, values, k): - self.sampler = np.arange(len(values)) - shuffle(self.sampler) - return values.take(self.sampler[:k]) +class LibFastZip(object): -class series_drop_duplicates_int(object): goal_time = 0.2 def setup(self): - self.s = Series(np.random.randint(0, 1000, size=10000)) - self.s2 = Series(np.tile(tm.makeStringIndex(1000).values, 10)) + N = 10000 + K = 10 + key1 = tm.makeStringIndex(N).values.repeat(K) + key2 = tm.makeStringIndex(N).values.repeat(K) + col_array = np.vstack([key1, key2, np.random.randn(N * K)]) + col_array2 = col_array.copy() + col_array2[:, :10000] = np.nan + self.col_array_list = list(col_array) - def time_series_drop_duplicates_int(self): - self.s.drop_duplicates() - - -class series_drop_duplicates_string(object): - goal_time = 0.2 - - def setup(self): - self.s = Series(np.random.randint(0, 1000, size=10000)) - self.s2 = Series(np.tile(tm.makeStringIndex(1000).values, 10)) - - def time_series_drop_duplicates_string(self): - self.s2.drop_duplicates() + def time_lib_fast_zip(self): + lib.fast_zip(self.col_array_list) diff --git a/asv_bench/benchmarks/replace.py b/asv_bench/benchmarks/replace.py index e9f33ebfce0bd..41208125e8f32 100644 --- a/asv_bench/benchmarks/replace.py +++ b/asv_bench/benchmarks/replace.py @@ -1,48 +1,58 @@ -from .pandas_vb_common import * -from pandas.compat import range -from datetime import timedelta +import numpy as np +import pandas as pd +from .pandas_vb_common import setup # noqa + + +class FillNa(object): -class replace_fillna(object): goal_time = 0.2 + params = [True, False] + param_names = ['inplace'] + + def setup(self, inplace): + N = 10**6 + rng = pd.date_range('1/1/2000', periods=N, freq='min') + data = np.random.randn(N) + data[::2] = np.nan + self.ts = pd.Series(data, index=rng) + + def time_fillna(self, inplace): + self.ts.fillna(0.0, inplace=inplace) - def setup(self): - self.N = 1000000 - try: - self.rng = date_range('1/1/2000', periods=self.N, freq='min') - except NameError: - self.rng = DatetimeIndex('1/1/2000', periods=self.N, offset=datetools.Minute()) - self.date_range = DateRange - self.ts = Series(np.random.randn(self.N), index=self.rng) + def time_replace(self, inplace): + self.ts.replace(np.nan, 0.0, inplace=inplace) - def time_replace_fillna(self): - self.ts.fillna(0.0, inplace=True) +class ReplaceDict(object): -class replace_large_dict(object): goal_time = 0.2 + params = [True, False] + param_names = ['inplace'] - def setup(self): - self.n = (10 ** 6) - self.start_value = (10 ** 5) - self.to_rep = dict(((i, (self.start_value + i)) for i in range(self.n))) - self.s = 
Series(np.random.randint(self.n, size=(10 ** 3))) + def setup(self, inplace): + N = 10**5 + start_value = 10**5 + self.to_rep = dict(enumerate(np.arange(N) + start_value)) + self.s = pd.Series(np.random.randint(N, size=10**3)) - def time_replace_large_dict(self): - self.s.replace(self.to_rep, inplace=True) + def time_replace_series(self, inplace): + self.s.replace(self.to_rep, inplace=inplace) -class replace_replacena(object): - goal_time = 0.2 +class Convert(object): + + goal_time = 0.5 + params = (['DataFrame', 'Series'], ['Timestamp', 'Timedelta']) + param_names = ['constructor', 'replace_data'] + + def setup(self, constructor, replace_data): + N = 10**3 + data = {'Series': pd.Series(np.random.randint(N, size=N)), + 'DataFrame': pd.DataFrame({'A': np.random.randint(N, size=N), + 'B': np.random.randint(N, size=N)})} + self.to_replace = {i: getattr(pd, replace_data) for i in range(N)} + self.data = data[constructor] - def setup(self): - self.N = 1000000 - try: - self.rng = date_range('1/1/2000', periods=self.N, freq='min') - except NameError: - self.rng = DatetimeIndex('1/1/2000', periods=self.N, offset=datetools.Minute()) - self.date_range = DateRange - self.ts = Series(np.random.randn(self.N), index=self.rng) - - def time_replace_replacena(self): - self.ts.replace(np.nan, 0.0, inplace=True) \ No newline at end of file + def time_replace(self, constructor, replace_data): + self.data.replace(self.to_replace) diff --git a/asv_bench/benchmarks/reshape.py b/asv_bench/benchmarks/reshape.py index 604fa5092a231..9044b080c45f9 100644 --- a/asv_bench/benchmarks/reshape.py +++ b/asv_bench/benchmarks/reshape.py @@ -1,13 +1,16 @@ -from .pandas_vb_common import * -from pandas.core.reshape import melt +from itertools import product +import numpy as np +from pandas import DataFrame, MultiIndex, date_range, melt, wide_to_long + +from .pandas_vb_common import setup # noqa + + +class Melt(object): -class melt_dataframe(object): goal_time = 0.2 def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) self.df = DataFrame(np.random.randn(10000, 3), columns=['A', 'B', 'C']) self.df['id1'] = np.random.randint(0, 10, 10000) self.df['id2'] = np.random.randint(100, 1000, 10000) @@ -16,61 +19,116 @@ def time_melt_dataframe(self): melt(self.df, id_vars=['id1', 'id2']) -class reshape_pivot_time_series(object): +class Pivot(object): + goal_time = 0.2 def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) - self.index = date_range('1/1/2000', periods=10000, freq='h') - self.df = DataFrame(randn(10000, 50), index=self.index, columns=range(50)) - self.pdf = self.unpivot(self.df) - self.f = (lambda : self.pdf.pivot('date', 'variable', 'value')) + N = 10000 + index = date_range('1/1/2000', periods=N, freq='h') + data = {'value': np.random.randn(N * 50), + 'variable': np.arange(50).repeat(N), + 'date': np.tile(index.values, 50)} + self.df = DataFrame(data) def time_reshape_pivot_time_series(self): - self.f() + self.df.pivot('date', 'variable', 'value') - def unpivot(self, frame): - (N, K) = frame.shape - self.data = {'value': frame.values.ravel('F'), 'variable': np.asarray(frame.columns).repeat(N), 'date': np.tile(np.asarray(frame.index), K), } - return DataFrame(self.data, columns=['date', 'variable', 'value']) +class SimpleReshape(object): -class 
reshape_stack_simple(object): goal_time = 0.2 def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) + arrays = [np.arange(100).repeat(100), + np.roll(np.tile(np.arange(100), 100), 25)] + index = MultiIndex.from_arrays(arrays) + self.df = DataFrame(np.random.randn(10000, 4), index=index) self.udf = self.df.unstack(1) - def time_reshape_stack_simple(self): + def time_stack(self): self.udf.stack() + def time_unstack(self): + self.df.unstack(1) + + +class Unstack(object): -class reshape_unstack_simple(object): goal_time = 0.2 def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) + m = 100 + n = 1000 + + levels = np.arange(m) + index = MultiIndex.from_product([levels] * 2) + columns = np.arange(n) + values = np.arange(m * m * n).reshape(m * m, n) + self.df = DataFrame(values, index, columns) + self.df2 = self.df.iloc[:-1] + + def time_full_product(self): + self.df.unstack() + + def time_without_last_row(self): + self.df2.unstack() + + +class SparseIndex(object): + + goal_time = 0.2 + + def setup(self): + NUM_ROWS = 1000 + self.df = DataFrame({'A': np.random.randint(50, size=NUM_ROWS), + 'B': np.random.randint(50, size=NUM_ROWS), + 'C': np.random.randint(-10, 10, size=NUM_ROWS), + 'D': np.random.randint(-10, 10, size=NUM_ROWS), + 'E': np.random.randint(10, size=NUM_ROWS), + 'F': np.random.randn(NUM_ROWS)}) + self.df = self.df.set_index(['A', 'B', 'C', 'D', 'E']) + + def time_unstack(self): + self.df.unstack() + + +class WideToLong(object): + + goal_time = 0.2 + + def setup(self): + nyrs = 20 + nidvars = 20 + N = 5000 + self.letters = list('ABCD') + yrvars = [l + str(num) + for l, num in product(self.letters, range(1, nyrs + 1))] + columns = [str(i) for i in range(nidvars)] + yrvars + self.df = DataFrame(np.random.randn(N, nidvars + len(yrvars)), + columns=columns) + self.df['id'] = self.df.index + + def time_wide_to_long_big(self): + wide_to_long(self.df, self.letters, i='id', j='year') - def time_reshape_unstack_simple(self): - self.df.unstack(1) +class PivotTable(object): -class unstack_sparse_keyspace(object): goal_time = 0.2 def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) - self.NUM_ROWS = 1000 - for iter in range(10): - self.df = DataFrame({'A': np.random.randint(50, size=self.NUM_ROWS), 'B': np.random.randint(50, size=self.NUM_ROWS), 'C': np.random.randint((-10), 10, size=self.NUM_ROWS), 'D': np.random.randint((-10), 10, size=self.NUM_ROWS), 'E': np.random.randint(10, size=self.NUM_ROWS), 'F': np.random.randn(self.NUM_ROWS), }) - self.idf = self.df.set_index(['A', 'B', 'C', 'D', 'E']) - if (len(self.idf.index.unique()) == self.NUM_ROWS): - break - - def time_unstack_sparse_keyspace(self): - self.idf.unstack() \ No newline at end of file + N = 100000 + fac1 = np.array(['A', 'B', 'C'], dtype='O') + fac2 = np.array(['one', 'two'], dtype='O') + ind1 = np.random.randint(0, 3, size=N) + ind2 = np.random.randint(0, 2, size=N) + self.df = DataFrame({'key1': fac1.take(ind1), + 'key2': fac2.take(ind2), + 'key3': fac2.take(ind2), + 'value1': np.random.randn(N), + 'value2': np.random.randn(N), + 'value3': np.random.randn(N)}) + + def time_pivot_table(self): + 
self.df.pivot_table(index='key1', columns=['key2', 'key3']) diff --git a/asv_bench/benchmarks/rolling.py b/asv_bench/benchmarks/rolling.py new file mode 100644 index 0000000000000..e3bf551fa5f2b --- /dev/null +++ b/asv_bench/benchmarks/rolling.py @@ -0,0 +1,79 @@ +import pandas as pd +import numpy as np + +from .pandas_vb_common import setup # noqa + + +class Methods(object): + + sample_time = 0.2 + params = (['DataFrame', 'Series'], + [10, 1000], + ['int', 'float'], + ['median', 'mean', 'max', 'min', 'std', 'count', 'skew', 'kurt', + 'sum']) + param_names = ['constructor', 'window', 'dtype', 'method'] + + def setup(self, constructor, window, dtype, method): + N = 10**5 + arr = (100 * np.random.random(N)).astype(dtype) + self.roll = getattr(pd, constructor)(arr).rolling(window) + + def time_rolling(self, constructor, window, dtype, method): + getattr(self.roll, method)() + + +class VariableWindowMethods(Methods): + sample_time = 0.2 + params = (['DataFrame', 'Series'], + ['50s', '1h', '1d'], + ['int', 'float'], + ['median', 'mean', 'max', 'min', 'std', 'count', 'skew', 'kurt', + 'sum']) + param_names = ['constructor', 'window', 'dtype', 'method'] + + def setup(self, constructor, window, dtype, method): + N = 10**5 + arr = (100 * np.random.random(N)).astype(dtype) + index = pd.date_range('2017-01-01', periods=N, freq='5s') + self.roll = getattr(pd, constructor)(arr, index=index).rolling(window) + + +class Pairwise(object): + + sample_time = 0.2 + params = ([10, 1000, None], + ['corr', 'cov'], + [True, False]) + param_names = ['window', 'method', 'pairwise'] + + def setup(self, window, method, pairwise): + N = 10**4 + arr = np.random.random(N) + self.df = pd.DataFrame(arr) + + def time_pairwise(self, window, method, pairwise): + if window is None: + r = self.df.expanding() + else: + r = self.df.rolling(window=window) + getattr(r, method)(self.df, pairwise=pairwise) + + +class Quantile(object): + sample_time = 0.2 + params = (['DataFrame', 'Series'], + [10, 1000], + ['int', 'float'], + [0, 0.5, 1], + ['linear', 'nearest', 'lower', 'higher', 'midpoint']) + param_names = ['constructor', 'window', 'dtype', 'percentile', 'interpolation'] + + def setup(self, constructor, window, dtype, percentile, interpolation): + N = 10 ** 5 + arr = np.random.random(N).astype(dtype) + self.roll = getattr(pd, constructor)(arr).rolling(window) + + def time_quantile(self, constructor, window, dtype, percentile, + interpolation): + self.roll.quantile(percentile, interpolation=interpolation) diff --git a/asv_bench/benchmarks/series_methods.py b/asv_bench/benchmarks/series_methods.py index 37969a6949157..a5ccf5c32b876 100644 --- a/asv_bench/benchmarks/series_methods.py +++ b/asv_bench/benchmarks/series_methods.py @@ -1,73 +1,136 @@ -from .pandas_vb_common import * +from datetime import datetime +import numpy as np +import pandas.util.testing as tm +from pandas import Series, date_range, NaT + +from .pandas_vb_common import setup # noqa + + +class SeriesConstructor(object): -class series_isin_int64(object): goal_time = 0.2 + params = [None, 'dict'] + param_names = ['data'] - def setup(self): - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') - self.s4 = Series(np.random.randint(1, 100, 10000000)).astype('int64') - self.values = [1, 2] + def setup(self, data): + self.idx = date_range(start=datetime(2015, 10, 26), + end=datetime(2016, 1, 1), + freq='50s') + dict_data = dict(zip(self.idx, range(len(self.idx)))) + self.data = None if data is None else dict_data - def time_series_isin_int64(self): - self.s3.isin(self.values)
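Both the rolling benchmarks above and the series-method rewrite here rely on asv's parameterization: asv runs setup and each time_* method once per combination drawn from params, passing the chosen values positionally in param_names order, so a single class replaces one hand-written class per case. A minimal sketch of the mechanism under standard asv conventions (the Example class is illustrative, not part of this diff):

import numpy as np
import pandas as pd


class Example(object):
    # asv times every combination: ('DataFrame', 10), ('DataFrame', 1000),
    # ('Series', 10), ('Series', 1000)
    params = (['DataFrame', 'Series'], [10, 1000])
    param_names = ['constructor', 'window']

    def setup(self, constructor, window):
        arr = np.random.random(10**5)
        self.roll = getattr(pd, constructor)(arr).rolling(window)

    def time_mean(self, constructor, window):
        self.roll.mean()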
+ def time_constructor(self, data): + Series(data=self.data, index=self.idx) - def time_series_isin_int64_large(self): - self.s4.isin(self.values) +class IsIn(object): -class series_isin_object(object): goal_time = 0.2 + params = ['int64', 'object'] + param_names = ['dtype'] - def setup(self): - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') + def setup(self, dtype): + self.s = Series(np.random.randint(1, 10, 100000)).astype(dtype) self.values = [1, 2] - self.s4 = self.s3.astype('object') - def time_series_isin_object(self): - self.s4.isin(self.values) + def time_isin(self, dtype): + self.s.isin(self.values) + + +class NSort(object): + + goal_time = 0.2 + params = ['first', 'last', 'all'] + param_names = ['keep'] + + def setup(self, keep): + self.s = Series(np.random.randint(1, 10, 100000)) + + def time_nlargest(self, keep): + self.s.nlargest(3, keep=keep) + + def time_nsmallest(self, keep): + self.s.nsmallest(3, keep=keep) + + +class Dropna(object): + + goal_time = 0.2 + params = ['int', 'datetime'] + param_names = ['dtype'] + + def setup(self, dtype): + N = 10**6 + data = {'int': np.random.randint(1, 10, N), + 'datetime': date_range('2000-01-01', freq='S', periods=N)} + self.s = Series(data[dtype]) + if dtype == 'datetime': + self.s[np.random.randint(1, N, 100)] = NaT + def time_dropna(self, dtype): + self.s.dropna() + + +class Map(object): + + goal_time = 0.2 + params = ['dict', 'Series'] + param_names = ['mapper'] + + def setup(self, mapper): + map_size = 1000 + map_data = Series(map_size - np.arange(map_size)) + self.map_data = map_data if mapper == 'Series' else map_data.to_dict() + self.s = Series(np.random.randint(0, map_size, 10000)) + + def time_map(self, mapper): + self.s.map(self.map_data) + + +class Clip(object): -class series_nlargest1(object): goal_time = 0.2 def setup(self): - self.s1 = Series(np.random.randn(10000)) - self.s2 = Series(np.random.randint(1, 10, 10000)) - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') - self.values = [1, 2] - self.s4 = self.s3.astype('object') + self.s = Series(np.random.randn(50)) - def time_series_nlargest1(self): - self.s1.nlargest(3, take_last=True) - self.s1.nlargest(3, take_last=False) + def time_clip(self): + self.s.clip(0, 1) -class series_nlargest2(object): +class ValueCounts(object): + + goal_time = 0.2 + params = ['int', 'float', 'object'] + param_names = ['dtype'] + + def setup(self, dtype): + self.s = Series(np.random.randint(0, 1000, size=100000)).astype(dtype) + + def time_value_counts(self, dtype): + self.s.value_counts() + + +class Dir(object): + goal_time = 0.2 def setup(self): - self.s1 = Series(np.random.randn(10000)) - self.s2 = Series(np.random.randint(1, 10, 10000)) - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') - self.values = [1, 2] - self.s4 = self.s3.astype('object') + self.s = Series(index=tm.makeStringIndex(10000)) - def time_series_nlargest2(self): - self.s2.nlargest(3, take_last=True) - self.s2.nlargest(3, take_last=False) + def time_dir_strings(self): + dir(self.s) -class series_nsmallest2(object): +class SeriesGetattr(object): + # https://github.com/pandas-dev/pandas/issues/19764 goal_time = 0.2 def setup(self): - self.s1 = Series(np.random.randn(10000)) - self.s2 = Series(np.random.randint(1, 10, 10000)) - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') - self.values = [1, 2] - self.s4 = self.s3.astype('object') + self.s = Series(1, + index=date_range("2012-01-01", freq='s', + periods=int(1e6))) - def
time_series_nsmallest2(self): - self.s2.nsmallest(3, take_last=True) - self.s2.nsmallest(3, take_last=False) + def time_series_datetimeindex_repr(self): + getattr(self.s, 'a', None) diff --git a/asv_bench/benchmarks/sparse.py b/asv_bench/benchmarks/sparse.py index d7ee58fc978ea..dcb7694abc2ad 100644 --- a/asv_bench/benchmarks/sparse.py +++ b/asv_bench/benchmarks/sparse.py @@ -1,55 +1,162 @@ -from .pandas_vb_common import * -import pandas.sparse.series +import itertools + +import numpy as np import scipy.sparse -from pandas.core.sparse import SparseSeries, SparseDataFrame -from pandas.core.sparse import SparseDataFrame +from pandas import (SparseSeries, SparseDataFrame, SparseArray, Series, + date_range, MultiIndex) + +from .pandas_vb_common import setup # noqa + + +def make_array(size, dense_proportion, fill_value, dtype): + dense_size = int(size * dense_proportion) + arr = np.full(size, fill_value, dtype) + indexer = np.random.choice(np.arange(size), dense_size, replace=False) + arr[indexer] = np.random.choice(np.arange(100, dtype=dtype), dense_size) + return arr + +class SparseSeriesToFrame(object): -class sparse_series_to_frame(object): goal_time = 0.2 def setup(self): - self.K = 50 - self.N = 50000 - self.rng = np.asarray(date_range('1/1/2000', periods=self.N, freq='T')) + K = 50 + N = 50001 + rng = date_range('1/1/2000', periods=N, freq='T') self.series = {} - for i in range(1, (self.K + 1)): - self.data = np.random.randn(self.N)[:(- i)] - self.this_rng = self.rng[:(- i)] - self.data[100:] = np.nan - self.series[i] = SparseSeries(self.data, index=self.this_rng) + for i in range(1, K): + data = np.random.randn(N)[:-i] + idx = rng[:-i] + data[100:] = np.nan + self.series[i] = SparseSeries(data, index=idx) - def time_sparse_series_to_frame(self): + def time_series_to_frame(self): SparseDataFrame(self.series) -class sparse_frame_constructor(object): +class SparseArrayConstructor(object): + goal_time = 0.2 + params = ([0.1, 0.01], [0, np.nan], + [np.int64, np.float64, np.object]) + param_names = ['dense_proportion', 'fill_value', 'dtype'] + + def setup(self, dense_proportion, fill_value, dtype): + N = 10**6 + self.array = make_array(N, dense_proportion, fill_value, dtype) + + def time_sparse_array(self, dense_proportion, fill_value, dtype): + SparseArray(self.array, fill_value=fill_value, dtype=dtype) - def time_sparse_frame_constructor(self): - SparseDataFrame(columns=np.arange(100), index=np.arange(1000)) +class SparseDataFrameConstructor(object): -class sparse_series_from_coo(object): goal_time = 0.2 def setup(self): - self.A = scipy.sparse.coo_matrix(([3.0, 1.0, 2.0], ([1, 0, 0], [0, 2, 3])), shape=(100, 100)) + N = 1000 + self.arr = np.arange(N) + self.sparse = scipy.sparse.rand(N, N, 0.005) + self.dict = dict(zip(range(N), itertools.repeat([0]))) + + def time_constructor(self): + SparseDataFrame(columns=self.arr, index=self.arr) + + def time_from_scipy(self): + SparseDataFrame(self.sparse) + + def time_from_dict(self): + SparseDataFrame(self.dict) + + +class FromCoo(object): + + goal_time = 0.2 + + def setup(self): + self.matrix = scipy.sparse.coo_matrix(([3.0, 1.0, 2.0], + ([1, 0, 0], [0, 2, 3])), + shape=(100, 100)) def time_sparse_series_from_coo(self): - self.ss = pandas.sparse.series.SparseSeries.from_coo(self.A) + SparseSeries.from_coo(self.matrix) -class sparse_series_to_coo(object): +class ToCoo(object): + goal_time = 0.2 def setup(self): - self.s = pd.Series(([np.nan] * 10000)) - self.s[0] = 3.0 - self.s[100] = (-1.0) - self.s[999] = 12.1 - self.s.index = 
pd.MultiIndex.from_product((range(10), range(10), range(10), range(10))) - self.ss = self.s.to_sparse() + s = Series([np.nan] * 10000) + s[0] = 3.0 + s[100] = -1.0 + s[999] = 12.1 + s.index = MultiIndex.from_product([range(10)] * 4) + self.ss = s.to_sparse() def time_sparse_series_to_coo(self): - self.ss.to_coo(row_levels=[0, 1], column_levels=[2, 3], sort_labels=True) \ No newline at end of file + self.ss.to_coo(row_levels=[0, 1], + column_levels=[2, 3], + sort_labels=True) + + +class Arithmetic(object): + + goal_time = 0.2 + params = ([0.1, 0.01], [0, np.nan]) + param_names = ['dense_proportion', 'fill_value'] + + def setup(self, dense_proportion, fill_value): + N = 10**6 + arr1 = make_array(N, dense_proportion, fill_value, np.int64) + self.array1 = SparseArray(arr1, fill_value=fill_value) + arr2 = make_array(N, dense_proportion, fill_value, np.int64) + self.array2 = SparseArray(arr2, fill_value=fill_value) + + def time_make_union(self, dense_proportion, fill_value): + self.array1.sp_index.make_union(self.array2.sp_index) + + def time_intersect(self, dense_proportion, fill_value): + self.array1.sp_index.intersect(self.array2.sp_index) + + def time_add(self, dense_proportion, fill_value): + self.array1 + self.array2 + + def time_divide(self, dense_proportion, fill_value): + self.array1 / self.array2 + + +class ArithmeticBlock(object): + + goal_time = 0.2 + params = [np.nan, 0] + param_names = ['fill_value'] + + def setup(self, fill_value): + N = 10**6 + self.arr1 = self.make_block_array(length=N, num_blocks=1000, + block_size=10, fill_value=fill_value) + self.arr2 = self.make_block_array(length=N, num_blocks=1000, + block_size=10, fill_value=fill_value) + + def make_block_array(self, length, num_blocks, block_size, fill_value): + arr = np.full(length, fill_value) + indices = np.random.choice(np.arange(0, length, block_size), + num_blocks, + replace=False) + for ind in indices: + arr[ind:ind + block_size] = np.random.randint(0, 100, block_size) + return SparseArray(arr, fill_value=fill_value) + + def time_make_union(self, fill_value): + self.arr1.sp_index.make_union(self.arr2.sp_index) + + def time_intersect(self, fill_value): + self.arr1.sp_index.intersect(self.arr2.sp_index) + + def time_addition(self, fill_value): + self.arr1 + self.arr2 + + def time_division(self, fill_value): + self.arr1 / self.arr2 diff --git a/asv_bench/benchmarks/stat_ops.py b/asv_bench/benchmarks/stat_ops.py index 4125357455d2e..c447c78d0d070 100644 --- a/asv_bench/benchmarks/stat_ops.py +++ b/asv_bench/benchmarks/stat_ops.py @@ -1,236 +1,114 @@ -from .pandas_vb_common import * +import numpy as np +import pandas as pd +from .pandas_vb_common import setup # noqa -class stat_ops_frame_mean_float_axis_0(object): - goal_time = 0.2 - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) +ops = ['mean', 'sum', 'median', 'std', 'skew', 'kurt', 'mad', 'prod', 'sem', + 'var'] - def time_stat_ops_frame_mean_float_axis_0(self): - self.df.mean() +class FrameOps(object): -class stat_ops_frame_mean_float_axis_1(object): goal_time = 0.2 + params = [ops, ['float', 'int'], [0, 1], [True, False]] + param_names = ['op', 'dtype', 'axis', 'use_bottleneck'] - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) - - def time_stat_ops_frame_mean_float_axis_1(self): - self.df.mean(1) - - -class stat_ops_frame_mean_int_axis_0(object): - goal_time = 0.2
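FrameOps and SeriesOps below time each reduction with bottleneck both enabled and disabled. The use_bottleneck parameter is applied through the pandas option, falling back to the private switch in pandas.core.nanops for older pandas versions that predate the option. Roughly, as a sketch of the toggle mirrored by the setup code that follows (assuming, as in pandas.core.config, that OptionError subclasses AttributeError):

import pandas as pd

try:
    # modern pandas exposes the switch as a regular option
    pd.options.compute.use_bottleneck = False
except AttributeError:
    # older pandas: flip the module-level flag directly
    from pandas.core import nanops
    nanops._USE_BOTTLENECK = False

+ def setup(self, op, 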
dtype, axis, use_bottleneck): + df = pd.DataFrame(np.random.randn(100000, 4)).astype(dtype) + try: + pd.options.compute.use_bottleneck = use_bottleneck + except: + from pandas.core import nanops + nanops._USE_BOTTLENECK = use_bottleneck + self.df_func = getattr(df, op) - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) + def time_op(self, op, dtype, axis, use_bottleneck): + self.df_func(axis=axis) - def time_stat_ops_frame_mean_int_axis_0(self): - self.dfi.mean() +class FrameMultiIndexOps(object): -class stat_ops_frame_mean_int_axis_1(object): goal_time = 0.2 + params = ([0, 1, [0, 1]], ops) + param_names = ['level', 'op'] - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) - - def time_stat_ops_frame_mean_int_axis_1(self): - self.dfi.mean(1) - - -class stat_ops_frame_sum_float_axis_0(object): - goal_time = 0.2 + def setup(self, level, op): + levels = [np.arange(10), np.arange(100), np.arange(100)] + labels = [np.arange(10).repeat(10000), + np.tile(np.arange(100).repeat(100), 10), + np.tile(np.tile(np.arange(100), 100), 10)] + index = pd.MultiIndex(levels=levels, labels=labels) + df = pd.DataFrame(np.random.randn(len(index), 4), index=index) + self.df_func = getattr(df, op) - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) + def time_op(self, level, op): + self.df_func(level=level) - def time_stat_ops_frame_sum_float_axis_0(self): - self.df.sum() +class SeriesOps(object): -class stat_ops_frame_sum_float_axis_1(object): goal_time = 0.2 + params = [ops, ['float', 'int'], [True, False]] + param_names = ['op', 'dtype', 'use_bottleneck'] - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) + def setup(self, op, dtype, use_bottleneck): + s = pd.Series(np.random.randn(100000)).astype(dtype) + try: + pd.options.compute.use_bottleneck = use_bottleneck + except: + from pandas.core import nanops + nanops._USE_BOTTLENECK = use_bottleneck + self.s_func = getattr(s, op) - def time_stat_ops_frame_sum_float_axis_1(self): - self.df.sum(1) + def time_op(self, op, dtype, use_bottleneck): + self.s_func() -class stat_ops_frame_sum_int_axis_0(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) - - def time_stat_ops_frame_sum_int_axis_0(self): - self.dfi.sum() - +class SeriesMultiIndexOps(object): -class stat_ops_frame_sum_int_axis_1(object): goal_time = 0.2 + params = ([0, 1, [0, 1]], ops) + param_names = ['level', 'op'] - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) - - def time_stat_ops_frame_sum_int_axis_1(self): - self.dfi.sum(1) - - -class stat_ops_level_frame_sum(object): - goal_time = 0.2 + def setup(self, level, op): + levels = [np.arange(10), np.arange(100), np.arange(100)] + labels = [np.arange(10).repeat(10000), + np.tile(np.arange(100).repeat(100), 10), + np.tile(np.tile(np.arange(100), 100), 10)] + index = pd.MultiIndex(levels=levels, labels=labels) + s = pd.Series(np.random.randn(len(index)), index=index) + self.s_func = getattr(s, op) - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], 
labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) + def time_op(self, level, op): + self.s_func(level=level) - def time_stat_ops_level_frame_sum(self): - self.df.sum(level=1) +class Rank(object): -class stat_ops_level_frame_sum_multiple(object): goal_time = 0.2 + params = [['DataFrame', 'Series'], [True, False]] + param_names = ['constructor', 'pct'] - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) - - def time_stat_ops_level_frame_sum_multiple(self): - self.df.sum(level=[0, 1]) - - -class stat_ops_level_series_sum(object): - goal_time = 0.2 - - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) - - def time_stat_ops_level_series_sum(self): - self.df[1].sum(level=1) - - -class stat_ops_level_series_sum_multiple(object): - goal_time = 0.2 - - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) - - def time_stat_ops_level_series_sum_multiple(self): - self.df[1].sum(level=[0, 1]) - - -class stat_ops_series_std(object): - goal_time = 0.2 - - def setup(self): - self.s = Series(np.random.randn(100000), index=np.arange(100000)) - self.s[::2] = np.nan - - def time_stat_ops_series_std(self): - self.s.std() + def setup(self, constructor, pct): + values = np.random.randn(10**5) + self.data = getattr(pd, constructor)(values) + def time_rank(self, constructor, pct): + self.data.rank(pct=pct) -class stats_corr_spearman(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 30)) - - def time_stats_corr_spearman(self): - self.df.corr(method='spearman') - - -class stats_rank2d_axis0_average(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(5000, 50)) - - def time_stats_rank2d_axis0_average(self): - self.df.rank() - - -class stats_rank2d_axis1_average(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(5000, 50)) - - def time_stats_rank2d_axis1_average(self): - self.df.rank(1) - - -class stats_rank_average(object): - goal_time = 0.2 - - def setup(self): - self.values = np.concatenate([np.arange(100000), np.random.randn(100000), np.arange(100000)]) - self.s = Series(self.values) - - def time_stats_rank_average(self): - self.s.rank() - - -class 
stats_rank_average_int(object): - goal_time = 0.2 - - def setup(self): - self.values = np.random.randint(0, 100000, size=200000) - self.s = Series(self.values) - - def time_stats_rank_average_int(self): - self.s.rank() - - -class stats_rank_pct_average(object): - goal_time = 0.2 - - def setup(self): - self.values = np.concatenate([np.arange(100000), np.random.randn(100000), np.arange(100000)]) - self.s = Series(self.values) - - def time_stats_rank_pct_average(self): - self.s.rank(pct=True) - - -class stats_rank_pct_average_old(object): - goal_time = 0.2 - - def setup(self): - self.values = np.concatenate([np.arange(100000), np.random.randn(100000), np.arange(100000)]) - self.s = Series(self.values) + def time_average_old(self, constructor, pct): + self.data.rank(pct=pct) / len(self.data) - def time_stats_rank_pct_average_old(self): - (self.s.rank() / len(self.s)) +class Correlation(object): -class stats_rolling_mean(object): goal_time = 0.2 + params = ['spearman', 'kendall', 'pearson'] + param_names = ['method'] - def setup(self): - self.arr = np.random.randn(100000) + def setup(self, method): + self.df = pd.DataFrame(np.random.randn(1000, 30)) - def time_stats_rolling_mean(self): - rolling_mean(self.arr, 100) \ No newline at end of file + def time_corr(self, method): + self.df.corr(method=method) diff --git a/asv_bench/benchmarks/strings.py b/asv_bench/benchmarks/strings.py index e4f91b1b9c0c6..b203c8b0fa5c9 100644 --- a/asv_bench/benchmarks/strings.py +++ b/asv_bench/benchmarks/strings.py @@ -1,393 +1,147 @@ -from .pandas_vb_common import * -import string -import itertools as IT -import pandas.util.testing as testing +import warnings +import numpy as np +from pandas import Series +import pandas.util.testing as tm -class strings_cat(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_cat(self): - self.many.str.cat(sep=',') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) +class Methods(object): -class strings_center(object): goal_time = 0.2 def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) + self.s = Series(tm.makeStringIndex(10**5)) - def time_strings_center(self): - self.many.str.center(100) + def time_cat(self): + self.s.str.cat(sep=',') - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) + def time_center(self): + self.s.str.center(100) + def time_count(self): + self.s.str.count('A') -class strings_contains_few(object): - goal_time = 0.2 + def time_endswith(self): + self.s.str.endswith('A') - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) + def time_extract(self): + with warnings.catch_warnings(record=True): + self.s.str.extract('(\\w*)A(\\w*)') - def time_strings_contains_few(self): - self.few.str.contains('matchthis') + def time_findall(self): + self.s.str.findall('[A-Z]+') - def make_series(self, 
letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) + def time_get(self): + self.s.str.get(0) + def time_len(self): + self.s.str.len() -class strings_contains_few_noregex(object): - goal_time = 0.2 + def time_match(self): + self.s.str.match('A') - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) + def time_pad(self): + self.s.str.pad(100, side='both') - def time_strings_contains_few_noregex(self): - self.few.str.contains('matchthis', regex=False) + def time_replace(self): + self.s.str.replace('A', '\x01\x01') - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) + def time_slice(self): + self.s.str.slice(5, 15, 2) + def time_startswith(self): + self.s.str.startswith('A') -class strings_contains_many(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_contains_many(self): - self.many.str.contains('matchthis') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_contains_many_noregex(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_contains_many_noregex(self): - self.many.str.contains('matchthis', regex=False) - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_count(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_count(self): - self.many.str.count('matchthis') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_encode_decode(object): - goal_time = 0.2 - - def setup(self): - self.ser = Series(testing.makeUnicodeIndex()) + def time_strip(self): + self.s.str.strip('A') - def time_strings_encode_decode(self): - self.ser.str.encode('utf-8').str.decode('utf-8') + def time_rstrip(self): + self.s.str.rstrip('A') + def time_lstrip(self): + self.s.str.lstrip('A') -class strings_endswith(object): - goal_time = 0.2 + def time_title(self): + self.s.str.title() - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) + def time_upper(self): + self.s.str.upper() - def time_strings_endswith(self): - self.many.str.endswith('matchthis') + def time_lower(self): + self.s.str.lower() - def make_series(self, letters, 
strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) +class Repeat(object): -class strings_extract(object): goal_time = 0.2 + params = ['int', 'array'] + param_names = ['repeats'] - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) + def setup(self, repeats): + N = 10**5 + self.s = Series(tm.makeStringIndex(N)) + repeat = {'int': 1, 'array': np.random.randint(1, 3, N)} + self.repeat = repeat[repeats] - def time_strings_extract(self): - self.many.str.extract('(\\w*)matchthis(\\w*)') + def time_repeat(self, repeats): + self.s.str.repeat(self.repeat) - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) +class Contains(object): -class strings_findall(object): goal_time = 0.2 + params = [True, False] + param_names = ['regex'] - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) + def setup(self, regex): + self.s = Series(tm.makeStringIndex(10**5)) - def time_strings_findall(self): - self.many.str.findall('[A-Z]+') + def time_contains(self, regex): + self.s.str.contains('A', regex=regex) - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) +class Split(object): -class strings_get(object): goal_time = 0.2 + params = [True, False] + param_names = ['expand'] - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) + def setup(self, expand): + self.s = Series(tm.makeStringIndex(10**5)).str.join('--') - def time_strings_get(self): - self.many.str.get(0) + def time_split(self, expand): + self.s.str.split('--', expand=expand) - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) +class Dummies(object): -class strings_get_dummies(object): goal_time = 0.2 def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - self.s = self.make_series(string.ascii_uppercase, strlen=10, size=10000).str.join('|') + self.s = Series(tm.makeStringIndex(10**5)).str.join('|') - def time_strings_get_dummies(self): + def time_get_dummies(self): self.s.str.get_dummies('|') - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_join_split(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_join_split(self): - self.many.str.join('--').str.split('--') - - def make_series(self, letters, strlen, size): - 
return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_join_split_expand(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_join_split_expand(self): - self.many.str.join('--').str.split('--', expand=True) - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_len(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_len(self): - self.many.str.len() - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_lower(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_lower(self): - self.many.str.lower() - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) +class Encode(object): - -class strings_lstrip(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_lstrip(self): - self.many.str.lstrip('matchthis') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_match(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_match(self): - self.many.str.match('mat..this') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_pad(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_pad(self): - self.many.str.pad(100, side='both') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_repeat(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def 
time_strings_repeat(self): - self.many.str.repeat(list(IT.islice(IT.cycle(range(1, 4)), len(self.many)))) - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_replace(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_replace(self): - self.many.str.replace('(matchthis)', '\x01\x01') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_rstrip(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_rstrip(self): - self.many.str.rstrip('matchthis') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_slice(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_slice(self): - self.many.str.slice(5, 15, 2) - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_startswith(object): goal_time = 0.2 def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) + self.ser = Series(tm.makeUnicodeIndex()) - def time_strings_startswith(self): - self.many.str.startswith('matchthis') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_strip(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_strip(self): - self.many.str.strip('matchthis') - - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) - - -class strings_title(object): - goal_time = 0.2 - - def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_title(self): - self.many.str.title() + def time_encode_decode(self): + self.ser.str.encode('utf-8').str.decode('utf-8') - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) +class Slice(object): -class 
strings_upper(object): goal_time = 0.2 def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - - def time_strings_upper(self): - self.many.str.upper() + self.s = Series(['abcdefg', np.nan] * 500000) - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) \ No newline at end of file + def time_vector_slice(self): + # GH 2602 + self.s.str[:5] diff --git a/asv_bench/benchmarks/timedelta.py b/asv_bench/benchmarks/timedelta.py index 2f252a4d3e1dc..3fe75b3c34299 100644 --- a/asv_bench/benchmarks/timedelta.py +++ b/asv_bench/benchmarks/timedelta.py @@ -1,34 +1,129 @@ -from .pandas_vb_common import * -from pandas import to_timedelta +import datetime +import numpy as np +from pandas import Series, timedelta_range, to_timedelta, Timestamp, Timedelta + + +class TimedeltaConstructor(object): -class timedelta_convert_int(object): goal_time = 0.2 - def setup(self): - self.arr = np.random.randint(0, 1000, size=10000) + def time_from_int(self): + Timedelta(123456789) + + def time_from_unit(self): + Timedelta(1, unit='d') + + def time_from_components(self): + Timedelta(days=1, hours=2, minutes=3, seconds=4, milliseconds=5, + microseconds=6, nanoseconds=7) + + def time_from_datetime_timedelta(self): + Timedelta(datetime.timedelta(days=1, seconds=1)) + + def time_from_np_timedelta(self): + Timedelta(np.timedelta64(1, 'ms')) + + def time_from_string(self): + Timedelta('1 days') + + def time_from_iso_format(self): + Timedelta('P4DT12H30M5S') + + def time_from_missing(self): + Timedelta('nat') - def time_timedelta_convert_int(self): - to_timedelta(self.arr, unit='s') +class ToTimedelta(object): -class timedelta_convert_string(object): goal_time = 0.2 def setup(self): - self.arr = np.random.randint(0, 1000, size=10000) - self.arr = ['{0} days'.format(i) for i in self.arr] + self.ints = np.random.randint(0, 60, size=10000) + self.str_days = [] + self.str_seconds = [] + for i in self.ints: + self.str_days.append('{0} days'.format(i)) + self.str_seconds.append('00:00:{0:02d}'.format(i)) + + def time_convert_int(self): + to_timedelta(self.ints, unit='s') + + def time_convert_string_days(self): + to_timedelta(self.str_days) + + def time_convert_string_seconds(self): + to_timedelta(self.str_seconds) + + +class ToTimedeltaErrors(object): + + goal_time = 0.2 + params = ['coerce', 'ignore'] + param_names = ['errors'] + + def setup(self, errors): + ints = np.random.randint(0, 60, size=10000) + self.arr = ['{0} days'.format(i) for i in ints] + self.arr[-1] = 'apple' + + def time_convert(self, errors): + to_timedelta(self.arr, errors=errors) - def time_timedelta_convert_string(self): - to_timedelta(self.arr) +class TimedeltaOps(object): -class timedelta_convert_string_seconds(object): goal_time = 0.2 def setup(self): - self.arr = np.random.randint(0, 60, size=10000) - self.arr = ['00:00:{0:02d}'.format(i) for i in self.arr] + self.td = to_timedelta(np.arange(1000000)) + self.ts = Timestamp('2000') + + def time_add_td_ts(self): + self.td + self.ts + + +class TimedeltaProperties(object): + + goal_time = 0.2 + + def setup_cache(self): + td = Timedelta(days=365, minutes=35, seconds=25, milliseconds=35) + return td + + def time_timedelta_days(self, td): + td.days + + def time_timedelta_seconds(self, td): + td.seconds + + def 
time_timedelta_microseconds(self, td): + td.microseconds + + def time_timedelta_nanoseconds(self, td): + td.nanoseconds + + +class DatetimeAccessor(object): + + goal_time = 0.2 + + def setup_cache(self): + N = 100000 + series = Series(timedelta_range('1 days', periods=N, freq='h')) + return series + + def time_dt_accessor(self, series): + series.dt + + def time_timedelta_days(self, series): + series.dt.days + + def time_timedelta_seconds(self, series): + series.dt.seconds + + def time_timedelta_microseconds(self, series): + series.dt.microseconds - def time_timedelta_convert_string_seconds(self): - to_timedelta(self.arr) \ No newline at end of file + def time_timedelta_nanoseconds(self, series): + series.dt.nanoseconds diff --git a/asv_bench/benchmarks/timeseries.py b/asv_bench/benchmarks/timeseries.py index db0c526f25c7b..eada401d2930b 100644 --- a/asv_bench/benchmarks/timeseries.py +++ b/asv_bench/benchmarks/timeseries.py @@ -1,1163 +1,400 @@ -from pandas.tseries.converter import DatetimeConverter -from .pandas_vb_common import * -import pandas as pd +import warnings from datetime import timedelta -import datetime as dt + +import numpy as np +from pandas import to_datetime, date_range, Series, DataFrame, period_range +from pandas.tseries.frequencies import infer_freq try: - import pandas.tseries.holiday + from pandas.plotting._converter import DatetimeConverter except ImportError: - pass -from pandas.tseries.frequencies import infer_freq -import numpy as np - - -class dataframe_resample_max_numpy(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='20130101', periods=100000, freq='50L') - self.df = DataFrame(np.random.randn(100000, 2), index=self.rng) - - def time_dataframe_resample_max_numpy(self): - self.df.resample('1s', how=np.max) - - -class dataframe_resample_max_string(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='20130101', periods=100000, freq='50L') - self.df = DataFrame(np.random.randn(100000, 2), index=self.rng) - - def time_dataframe_resample_max_string(self): - self.df.resample('1s', how='max') - - -class dataframe_resample_mean_numpy(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='20130101', periods=100000, freq='50L') - self.df = DataFrame(np.random.randn(100000, 2), index=self.rng) - - def time_dataframe_resample_mean_numpy(self): - self.df.resample('1s', how=np.mean) - + from pandas.tseries.converter import DatetimeConverter -class dataframe_resample_mean_string(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='20130101', periods=100000, freq='50L') - self.df = DataFrame(np.random.randn(100000, 2), index=self.rng) 
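(The timeseries rewrite below replaces the deprecated `how=` argument of `resample` with the method-chaining API, and fetches the bound aggregation method once in `setup` so the timed call measures only the aggregation. A short sketch of the equivalence, with illustrative variable names only:

import numpy as np
from pandas import DataFrame, date_range

rng = date_range(start='20130101', periods=100000, freq='50L')
df = DataFrame(np.random.randn(100000, 2), index=rng)

# old, deprecated spelling:  df.resample('1s', how='mean')
res = df.resample('1s').mean()          # modern method-chaining API

# pre-binding the method, as the new benchmarks' setup() does:
resample_func = getattr(df.resample('1s'), 'mean')
res2 = resample_func()
)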
+from .pandas_vb_common import setup # noqa - def time_dataframe_resample_mean_string(self): - self.df.resample('1s', how='mean') +class DatetimeIndex(object): -class dataframe_resample_min_numpy(object): goal_time = 0.2 + params = ['dst', 'repeated', 'tz_aware', 'tz_naive'] + param_names = ['index_type'] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='20130101', periods=100000, freq='50L') - self.df = DataFrame(np.random.randn(100000, 2), index=self.rng) + def setup(self, index_type): + N = 100000 + dtidxes = {'dst': date_range(start='10/29/2000 1:00:00', + end='10/29/2000 1:59:59', freq='S'), + 'repeated': date_range(start='2000', + periods=N / 10, + freq='s').repeat(10), + 'tz_aware': date_range(start='2000', + periods=N, + freq='s', + tz='US/Eastern'), + 'tz_naive': date_range(start='2000', + periods=N, + freq='s')} + self.index = dtidxes[index_type] - def time_dataframe_resample_min_numpy(self): - self.df.resample('1s', how=np.min) + def time_add_timedelta(self, index_type): + self.index + timedelta(minutes=2) + def time_normalize(self, index_type): + self.index.normalize() -class dataframe_resample_min_string(object): - goal_time = 0.2 + def time_unique(self, index_type): + self.index.unique() - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='20130101', periods=100000, freq='50L') - self.df = DataFrame(np.random.randn(100000, 2), index=self.rng) + def time_to_time(self, index_type): + self.index.time - def time_dataframe_resample_min_string(self): - self.df.resample('1s', how='min') + def time_get(self, index_type): + self.index[0] + def time_timeseries_is_month_start(self, index_type): + self.index.is_month_start -class datetimeindex_add_offset(object): - goal_time = 0.2 + def time_to_date(self, index_type): + self.index.date - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='1/1/2000', periods=10000, freq='T') + def time_to_pydatetime(self, index_type): + self.index.to_pydatetime() - def time_datetimeindex_add_offset(self): - (self.rng + timedelta(minutes=2)) +class TzLocalize(object): -class datetimeindex_converter(object): goal_time = 0.2 def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) + dst_rng = date_range(start='10/29/2000 1:00:00', + end='10/29/2000 1:59:59', freq='S') + self.index = date_range(start='10/29/2000', + end='10/29/2000 00:59:59', freq='S') + self.index = self.index.append(dst_rng) + self.index = self.index.append(dst_rng) + self.index = self.index.append(date_range(start='10/29/2000 2:00:00', + end='10/29/2000 3:00:00', + freq='S')) - def time_datetimeindex_converter(self): - DatetimeConverter.convert(self.rng, None, None) + def time_infer_dst(self): + self.index.tz_localize('US/Eastern', ambiguous='infer') -class datetimeindex_infer_dst(object): - 
goal_time = 0.2
+class ResetIndex(object):

-    def setup(self):
-        self.N = 100000
-        self.rng = date_range(start='1/1/2000', periods=self.N, freq='T')
-        if hasattr(Series, 'convert'):
-            Series.resample = Series.convert
-        self.ts = Series(np.random.randn(self.N), index=self.rng)
-        self.dst_rng = date_range(start='10/29/2000 1:00:00', end='10/29/2000 1:59:59', freq='S')
-        self.index = date_range(start='10/29/2000', end='10/29/2000 00:59:59', freq='S')
-        self.index = self.index.append(self.dst_rng)
-        self.index = self.index.append(self.dst_rng)
-        self.index = self.index.append(date_range(start='10/29/2000 2:00:00', end='10/29/2000 3:00:00', freq='S'))
-
-    def time_datetimeindex_infer_dst(self):
-        self.index.tz_localize('US/Eastern', infer_dst=True)
-
-
-class datetimeindex_normalize(object):
     goal_time = 0.2
+    params = [None, 'US/Eastern']
+    param_names = ['tz']

-    def setup(self):
-        self.N = 100000
-        self.rng = date_range(start='1/1/2000', periods=self.N, freq='T')
-        if hasattr(Series, 'convert'):
-            Series.resample = Series.convert
-        self.ts = Series(np.random.randn(self.N), index=self.rng)
-        self.rng = date_range(start='1/1/2000 9:30', periods=10000, freq='S', tz='US/Eastern')
-
-    def time_datetimeindex_normalize(self):
-        self.rng.normalize()
-
+    def setup(self, tz):
+        idx = date_range(start='1/1/2000', periods=1000, freq='H', tz=tz)
+        self.df = DataFrame(np.random.randn(1000, 2), index=idx)

-class datetimeindex_unique(object):
-    goal_time = 0.2
-
-    def setup(self):
-        self.N = 100000
-        self.rng = date_range(start='1/1/2000', periods=self.N, freq='T')
-        if hasattr(Series, 'convert'):
-            Series.resample = Series.convert
-        self.ts = Series(np.random.randn(self.N), index=self.rng)
-        self.rng = date_range(start='1/1/2000', periods=1000, freq='T')
-        self.index = self.rng.repeat(10)
-
-    def time_datetimeindex_unique(self):
-        self.index.unique()
-
-
-class dti_reset_index(object):
-    goal_time = 0.2
-
-    def setup(self):
-        self.N = 100000
-        self.rng = date_range(start='1/1/2000', periods=self.N, freq='T')
-        if hasattr(Series, 'convert'):
-            Series.resample = Series.convert
-        self.ts = Series(np.random.randn(self.N), index=self.rng)
-        self.rng = date_range(start='1/1/2000', periods=1000, freq='H')
-        self.df = DataFrame(np.random.randn(len(self.rng), 2), self.rng)
-
-    def time_dti_reset_index(self):
+    def time_reset_datetimeindex(self, tz):
         self.df.reset_index()


-class dti_reset_index_tz(object):
-    goal_time = 0.2
-
-    def setup(self):
-        self.N = 100000
-        self.rng = date_range(start='1/1/2000', periods=self.N, freq='T')
-        if hasattr(Series, 'convert'):
-            Series.resample = Series.convert
-        self.ts = Series(np.random.randn(self.N), index=self.rng)
-        self.rng = date_range(start='1/1/2000', periods=1000, freq='H', tz='US/Eastern')
-        self.df = DataFrame(np.random.randn(len(self.rng), 2), index=self.rng)
-
-    def time_dti_reset_index_tz(self):
-        self.df.reset_index()
-
+class Factorize(object):

-class period_setitem(object):
     goal_time = 0.2
+    params = [None, 'Asia/Tokyo']
+    param_names = ['tz']

-    def setup(self):
-        self.N = 100000
-        self.rng = date_range(start='1/1/2000', periods=self.N, freq='T')
-        if hasattr(Series, 'convert'):
-            Series.resample = Series.convert
-        self.ts = Series(np.random.randn(self.N), index=self.rng)
-        self.rng = period_range(start='1/1/1990', freq='S', periods=20000)
-        self.df = DataFrame(index=range(len(self.rng)))
-
-    def time_period_setitem(self):
-        self.df['col'] = self.rng
-
-
-class timeseries_1min_5min_mean(object):
-    goal_time = 0.2
+    def setup(self, tz):
+        N = 100000
+        self.dti =
date_range('2011-01-01', freq='H', periods=N, tz=tz) + self.dti = self.dti.repeat(5) - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) + def time_factorize(self, tz): + self.dti.factorize() - def time_timeseries_1min_5min_mean(self): - self.ts[:10000].resample('5min', how='mean') +class InferFreq(object): -class timeseries_1min_5min_ohlc(object): goal_time = 0.2 + params = [None, 'D', 'B'] + param_names = ['freq'] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) + def setup(self, freq): + if freq is None: + self.idx = date_range(start='1/1/1700', freq='D', periods=10000) + self.idx.freq = None + else: + self.idx = date_range(start='1/1/1700', freq=freq, periods=10000) - def time_timeseries_1min_5min_ohlc(self): - self.ts[:10000].resample('5min', how='ohlc') + def time_infer_freq(self, freq): + infer_freq(self.idx) -class timeseries_add_irregular(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.lindex = np.random.permutation(self.N)[:(self.N // 2)] - self.rindex = np.random.permutation(self.N)[:(self.N // 2)] - self.left = Series(self.ts.values.take(self.lindex), index=self.ts.index.take(self.lindex)) - self.right = Series(self.ts.values.take(self.rindex), index=self.ts.index.take(self.rindex)) +class TimeDatetimeConverter(object): - def time_timeseries_add_irregular(self): - (self.left + self.right) - - -class timeseries_asof(object): goal_time = 0.2 def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 10000 - self.rng = date_range(start='1/1/1990', periods=self.N, freq='53s') - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.dates = date_range(start='1/1/1990', periods=(self.N * 10), freq='5s') - - def time_timeseries_asof(self): - self.ts.asof(self.dates) + N = 100000 + self.rng = date_range(start='1/1/2000', periods=N, freq='T') + def time_convert(self): + DatetimeConverter.convert(self.rng, None, None) -class timeseries_asof_nan(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 10000 - self.rng = date_range(start='1/1/1990', periods=self.N, freq='53s') - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.dates = date_range(start='1/1/1990', periods=(self.N * 10), freq='5s') - self.ts[250:5000] = np.nan - - def time_timeseries_asof_nan(self): - self.ts.asof(self.dates) +class Iteration(object): -class timeseries_asof_single(object): goal_time = 0.2 + params = [date_range, period_range] + param_names = ['time_index'] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = 
Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 10000 - self.rng = date_range(start='1/1/1990', periods=self.N, freq='53s') - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.dates = date_range(start='1/1/1990', periods=(self.N * 10), freq='5s') + def setup(self, time_index): + N = 10**6 + self.idx = time_index(start='20140101', freq='T', periods=N) + self.exit = 10000 - def time_timeseries_asof_single(self): - self.ts.asof(self.dates[0]) + def time_iter(self, time_index): + for _ in self.idx: + pass + def time_iter_preexit(self, time_index): + for i, _ in enumerate(self.idx): + if i > self.exit: + break -class timeseries_custom_bday_apply(object): - goal_time = 0.2 - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bday_apply(self): - self.cday.apply(self.date) - - -class timeseries_custom_bday_apply_dt64(object): - goal_time = 0.2 +class ResampleDataFrame(object): - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bday_apply_dt64(self): - self.cday.apply(self.dt64) - - -class timeseries_custom_bday_cal_decr(object): goal_time = 0.2 + params = ['max', 'mean', 'min'] + param_names = ['method'] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bday_cal_decr(self): - (self.date - (1 * self.cdayh)) - - -class timeseries_custom_bday_cal_incr(object): - goal_time = 0.2 + def setup(self, method): + rng = date_range(start='20130101', periods=100000, freq='50L') + df = DataFrame(np.random.randn(100000, 2), index=rng) + self.resample = getattr(df.resample('1s'), 
method) - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bday_cal_incr(self): - (self.date + (1 * self.cdayh)) - - -class timeseries_custom_bday_cal_incr_n(object): - goal_time = 0.2 + def time_method(self, method): + self.resample() - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bday_cal_incr_n(self): - (self.date + (10 * self.cdayh)) - - -class timeseries_custom_bday_cal_incr_neg_n(object): - goal_time = 0.2 - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bday_cal_incr_neg_n(self): - (self.date - (10 * self.cdayh)) - - -class timeseries_custom_bday_decr(object): - goal_time = 0.2 +class ResampleSeries(object): - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bday_decr(self): - (self.date - self.cday) - - -class timeseries_custom_bday_incr(object): goal_time = 0.2 + params = (['period', 'datetime'], ['5min', '1D'], ['mean', 'ohlc']) + 
param_names = ['index', 'freq', 'method'] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bday_incr(self): - (self.date + self.cday) - - -class timeseries_custom_bmonthbegin_decr_n(object): - goal_time = 0.2 + def setup(self, index, freq, method): + indexes = {'period': period_range(start='1/1/2000', + end='1/1/2001', + freq='T'), + 'datetime': date_range(start='1/1/2000', + end='1/1/2001', + freq='T')} + idx = indexes[index] + ts = Series(np.random.randn(len(idx)), index=idx) + self.resample = getattr(ts.resample(freq), method) - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bmonthbegin_decr_n(self): - (self.date - (10 * self.cmb)) - - -class timeseries_custom_bmonthbegin_incr_n(object): - goal_time = 0.2 + def time_resample(self, index, freq, method): + self.resample() - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bmonthbegin_incr_n(self): - (self.date + (10 * self.cmb)) - - -class timeseries_custom_bmonthend_decr_n(object): - goal_time = 0.2 - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - 
self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bmonthend_decr_n(self): - (self.date - (10 * self.cme)) - - -class timeseries_custom_bmonthend_incr(object): +class ResampleDatetetime64(object): + # GH 7754 goal_time = 0.2 def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bmonthend_incr(self): - (self.date + self.cme) - - -class timeseries_custom_bmonthend_incr_n(object): - goal_time = 0.2 + rng3 = date_range(start='2000-01-01 00:00:00', + end='2000-01-01 10:00:00', freq='555000U') + self.dt_ts = Series(5, rng3, dtype='datetime64[ns]') - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_custom_bmonthend_incr_n(self): - (self.date + (10 * self.cme)) - - -class timeseries_datetimeindex_offset_delta(object): - goal_time = 0.2 + def time_resample(self): + self.dt_ts.resample('1S').last() - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 100000 - self.idx1 = date_range(start='20140101', freq='T', periods=self.N) - self.delta_offset = pd.offsets.Day() - self.fast_offset = pd.offsets.DateOffset(months=2, days=2) - self.slow_offset = pd.offsets.BusinessDay() - - def time_timeseries_datetimeindex_offset_delta(self): - (self.idx1 + self.delta_offset) - - -class timeseries_datetimeindex_offset_fast(object): - goal_time = 0.2 - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 100000 - self.idx1 = date_range(start='20140101', freq='T', periods=self.N) - self.delta_offset = pd.offsets.Day() - self.fast_offset = pd.offsets.DateOffset(months=2, days=2) - self.slow_offset = pd.offsets.BusinessDay() - - def time_timeseries_datetimeindex_offset_fast(self): - (self.idx1 + self.fast_offset) - - -class timeseries_datetimeindex_offset_slow(object): - goal_time = 0.2 +class AsOf(object): - def setup(self): - self.N 
= 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 100000 - self.idx1 = date_range(start='20140101', freq='T', periods=self.N) - self.delta_offset = pd.offsets.Day() - self.fast_offset = pd.offsets.DateOffset(months=2, days=2) - self.slow_offset = pd.offsets.BusinessDay() - - def time_timeseries_datetimeindex_offset_slow(self): - (self.idx1 + self.slow_offset) - - -class timeseries_day_apply(object): goal_time = 0.2 + params = ['DataFrame', 'Series'] + param_names = ['constructor'] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_day_apply(self): - self.day.apply(self.date) - - -class timeseries_day_incr(object): - goal_time = 0.2 + def setup(self, constructor): + N = 10000 + M = 10 + rng = date_range(start='1/1/1990', periods=N, freq='53s') + data = {'DataFrame': DataFrame(np.random.randn(N, M)), + 'Series': Series(np.random.randn(N))} + self.ts = data[constructor] + self.ts.index = rng + self.ts2 = self.ts.copy() + self.ts2.iloc[250:5000] = np.nan + self.ts3 = self.ts.copy() + self.ts3.iloc[-5000:] = np.nan + self.dates = date_range(start='1/1/1990', periods=N * 10, freq='5s') + self.date = self.dates[0] + self.date_last = self.dates[-1] + self.date_early = self.date - timedelta(10) - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_day_incr(self): - (self.date + self.day) - - -class timeseries_infer_freq(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='1/1/1700', freq='D', periods=100000) - self.a = self.rng[:50000].append(self.rng[50002:]) + # test speed of pre-computing NAs. + def time_asof(self, constructor): + self.ts.asof(self.dates) - def time_timeseries_infer_freq(self): - infer_freq(self.a) + # should be roughly the same as above. 
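+    # (assumption: asof() computes the missing-value mask over the whole
+    # series up front either way, so the NaNs in ts2 should not change
+    # the per-call cost much)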
+ def time_asof_nan(self, constructor): + self.ts2.asof(self.dates) + # test speed of the code path for a scalar index + # without *while* loop + def time_asof_single(self, constructor): + self.ts.asof(self.date) -class timeseries_is_month_start(object): - goal_time = 0.2 + # test speed of the code path for a scalar index + # before the start. should be the same as above. + def time_asof_single_early(self, constructor): + self.ts.asof(self.date_early) - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 10000 - self.rng = date_range(start='1/1/1', periods=self.N, freq='B') + # test the speed of the code path for a scalar index + # with a long *while* loop. should still be much + # faster than pre-computing all the NAs. + def time_asof_nan_single(self, constructor): + self.ts3.asof(self.date_last) - def time_timeseries_is_month_start(self): - self.rng.is_month_start +class SortIndex(object): -class timeseries_iter_datetimeindex(object): goal_time = 0.2 + params = [True, False] + param_names = ['monotonic'] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 1000000 - self.M = 10000 - self.idx1 = date_range(start='20140101', freq='T', periods=self.N) - self.idx2 = period_range(start='20140101', freq='T', periods=self.N) - - def time_timeseries_iter_datetimeindex(self): - self.iter_n(self.idx1) - - def iter_n(self, iterable, n=None): - self.i = 0 - for _ in iterable: - self.i += 1 - if ((n is not None) and (self.i > n)): - break + def setup(self, monotonic): + N = 10**5 + idx = date_range(start='1/1/2000', periods=N, freq='s') + self.s = Series(np.random.randn(N), index=idx) + if not monotonic: + self.s = self.s.sample(frac=1) + def time_sort_index(self, monotonic): + self.s.sort_index() -class timeseries_iter_datetimeindex_preexit(object): - goal_time = 0.2 + def time_get_slice(self, monotonic): + self.s[:10000] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 1000000 - self.M = 10000 - self.idx1 = date_range(start='20140101', freq='T', periods=self.N) - self.idx2 = period_range(start='20140101', freq='T', periods=self.N) - - def time_timeseries_iter_datetimeindex_preexit(self): - self.iter_n(self.idx1, self.M) - - def iter_n(self, iterable, n=None): - self.i = 0 - for _ in iterable: - self.i += 1 - if ((n is not None) and (self.i > n)): - break +class IrregularOps(object): -class timeseries_iter_periodindex(object): goal_time = 0.2 def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 1000000 - self.M = 10000 - self.idx1 = date_range(start='20140101', freq='T', periods=self.N) - self.idx2 = period_range(start='20140101', freq='T', periods=self.N) - - def time_timeseries_iter_periodindex(self): - self.iter_n(self.idx2) - - def iter_n(self, iterable, n=None): - self.i = 0 - for _ in iterable: - self.i += 1 - if ((n is not None) and (self.i > 
n)): - break + N = 10**5 + idx = date_range(start='1/1/2000', periods=N, freq='s') + s = Series(np.random.randn(N), index=idx) + self.left = s.sample(frac=1) + self.right = s.sample(frac=1) + def time_add(self): + self.left + self.right -class timeseries_iter_periodindex_preexit(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 1000000 - self.M = 10000 - self.idx1 = date_range(start='20140101', freq='T', periods=self.N) - self.idx2 = period_range(start='20140101', freq='T', periods=self.N) - - def time_timeseries_iter_periodindex_preexit(self): - self.iter_n(self.idx2, self.M) - - def iter_n(self, iterable, n=None): - self.i = 0 - for _ in iterable: - self.i += 1 - if ((n is not None) and (self.i > n)): - break +class Lookup(object): -class timeseries_large_lookup_value(object): goal_time = 0.2 def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='1/1/2000', periods=1500000, freq='S') - self.ts = Series(1, index=self.rng) - - def time_timeseries_large_lookup_value(self): - self.ts[self.ts.index[(len(self.ts) // 2)]] - self.ts.index._cleanup() - - -class timeseries_period_downsample_mean(object): - goal_time = 0.2 + N = 1500000 + rng = date_range(start='1/1/2000', periods=N, freq='S') + self.ts = Series(1, index=rng) + self.lookup_val = rng[N // 2] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = period_range(start='1/1/2000', end='1/1/2001', freq='T') - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) + def time_lookup_and_cleanup(self): + self.ts[self.lookup_val] + self.ts.index._cleanup() - def time_timeseries_period_downsample_mean(self): - self.ts.resample('D', how='mean') +class ToDatetimeYYYYMMDD(object): -class timeseries_resample_datetime64(object): goal_time = 0.2 def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='2000-01-01 00:00:00', end='2000-01-01 10:00:00', freq='555000U') - self.int_ts = Series(5, self.rng, dtype='int64') - self.ts = self.int_ts.astype('datetime64[ns]') + rng = date_range(start='1/1/2000', periods=10000, freq='D') + self.stringsD = Series(rng.strftime('%Y%m%d')) - def time_timeseries_resample_datetime64(self): - self.ts.resample('1S', how='last') + def time_format_YYYYMMDD(self): + to_datetime(self.stringsD, format='%Y%m%d') -class timeseries_series_offset_delta(object): - goal_time = 0.2 +class ToDatetimeISO8601(object): - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 100000 - self.s = Series(date_range(start='20140101', freq='T', periods=self.N)) - self.delta_offset = pd.offsets.Day() - self.fast_offset = 
pd.offsets.DateOffset(months=2, days=2) - self.slow_offset = pd.offsets.BusinessDay() - - def time_timeseries_series_offset_delta(self): - (self.s + self.delta_offset) - - -class timeseries_series_offset_fast(object): goal_time = 0.2 def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 100000 - self.s = Series(date_range(start='20140101', freq='T', periods=self.N)) - self.delta_offset = pd.offsets.Day() - self.fast_offset = pd.offsets.DateOffset(months=2, days=2) - self.slow_offset = pd.offsets.BusinessDay() - - def time_timeseries_series_offset_fast(self): - (self.s + self.fast_offset) - - -class timeseries_series_offset_slow(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 100000 - self.s = Series(date_range(start='20140101', freq='T', periods=self.N)) - self.delta_offset = pd.offsets.Day() - self.fast_offset = pd.offsets.DateOffset(months=2, days=2) - self.slow_offset = pd.offsets.BusinessDay() - - def time_timeseries_series_offset_slow(self): - (self.s + self.slow_offset) - - -class timeseries_slice_minutely(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - - def time_timeseries_slice_minutely(self): - self.ts[:10000] + rng = date_range(start='1/1/2000', periods=20000, freq='H') + self.strings = rng.strftime('%Y-%m-%d %H:%M:%S').tolist() + self.strings_nosep = rng.strftime('%Y%m%d %H:%M:%S').tolist() + self.strings_tz_space = [x.strftime('%Y-%m-%d %H:%M:%S') + ' -0800' + for x in rng] + def time_iso8601(self): + to_datetime(self.strings) -class timeseries_sort_index(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='s') - self.rng = self.rng.take(np.random.permutation(self.N)) - self.ts = Series(np.random.randn(self.N), index=self.rng) - - def time_timeseries_sort_index(self): - self.ts.sort_index() + def time_iso8601_nosep(self): + to_datetime(self.strings_nosep) + def time_iso8601_format(self): + to_datetime(self.strings, format='%Y-%m-%d %H:%M:%S') -class timeseries_timestamp_downsample_mean(object): - goal_time = 0.2 + def time_iso8601_format_no_sep(self): + to_datetime(self.strings_nosep, format='%Y%m%d %H:%M:%S') - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='1/1/2000', end='1/1/2001', freq='T') - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) + def time_iso8601_tz_spaceformat(self): + to_datetime(self.strings_tz_space) - def time_timeseries_timestamp_downsample_mean(self): - self.ts.resample('D', how='mean') +class ToDatetimeFormat(object): 
-class timeseries_timestamp_tzinfo_cons(object): goal_time = 0.2 def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='1/1/2000', end='3/1/2000', tz='US/Eastern') + self.s = Series(['19MAY11', '19MAY11:00:00:00'] * 100000) + self.s2 = self.s.str.replace(':\\S+$', '') - def time_timeseries_timestamp_tzinfo_cons(self): - self.rng[0] + def time_exact(self): + to_datetime(self.s2, format='%d%b%y') + def time_no_exact(self): + to_datetime(self.s, format='%d%b%y', exact=False) -class timeseries_to_datetime_YYYYMMDD(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='1/1/2000', periods=10000, freq='D') - self.strings = Series((((self.rng.year * 10000) + (self.rng.month * 100)) + self.rng.day), dtype=np.int64).apply(str) - - def time_timeseries_to_datetime_YYYYMMDD(self): - to_datetime(self.strings, format='%Y%m%d') +class ToDatetimeCache(object): -class timeseries_to_datetime_iso8601(object): goal_time = 0.2 + params = [True, False] + param_names = ['cache'] - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='1/1/2000', periods=20000, freq='H') - self.strings = [x.strftime('%Y-%m-%d %H:%M:%S') for x in self.rng] - - def time_timeseries_to_datetime_iso8601(self): - to_datetime(self.strings) - + def setup(self, cache): + N = 10000 + self.unique_numeric_seconds = list(range(N)) + self.dup_numeric_seconds = [1000] * N + self.dup_string_dates = ['2000-02-11'] * N + self.dup_string_with_tz = ['2000-02-11 15:00:00-0800'] * N -class timeseries_to_datetime_iso8601_format(object): - goal_time = 0.2 + def time_unique_seconds_and_unit(self, cache): + to_datetime(self.unique_numeric_seconds, unit='s', cache=cache) - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.rng = date_range(start='1/1/2000', periods=20000, freq='H') - self.strings = [x.strftime('%Y-%m-%d %H:%M:%S') for x in self.rng] - - def time_timeseries_to_datetime_iso8601_format(self): - to_datetime(self.strings, format='%Y-%m-%d %H:%M:%S') + def time_dup_seconds_and_unit(self, cache): + to_datetime(self.dup_numeric_seconds, unit='s', cache=cache) + def time_dup_string_dates(self, cache): + to_datetime(self.dup_string_dates, cache=cache) -class timeseries_with_format_no_exact(object): - goal_time = 0.2 + def time_dup_string_dates_and_format(self, cache): + to_datetime(self.dup_string_dates, format='%Y-%m-%d', cache=cache) - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.s = Series((['19MAY11', '19MAY11:00:00:00'] * 100000)) - - def time_timeseries_with_format_no_exact(self): - to_datetime(self.s, format='%d%b%y', exact=False) 
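For context on the parameterized classes in this hunk (`SortIndex`, `ToDatetimeCache`): asv expands `params` into one benchmark run per value and passes that value to `setup` and to every `time_*` method. A minimal sketch of the mechanism, using a hypothetical class name and data, not part of the diff itself:

    from pandas import to_datetime

    class ToDatetimeCacheSketch(object):
        # asv runs this once with cache=True and once with cache=False
        params = [True, False]
        param_names = ['cache']

        def setup(self, cache):
            # many duplicate strings: the case where the parse cache pays off
            self.dates = ['2000-02-11'] * 10000

        def time_parse(self, cache):
            # cache=True parses each unique string once and reuses the result
            to_datetime(self.dates, cache=cache)
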
+ def time_dup_string_tzoffset_dates(self, cache): + to_datetime(self.dup_string_with_tz, cache=cache) -class timeseries_with_format_replace(object): - goal_time = 0.2 +class DatetimeAccessor(object): def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.s = Series((['19MAY11', '19MAY11:00:00:00'] * 100000)) - - def time_timeseries_with_format_replace(self): - to_datetime(self.s.str.replace(':\\S+$', ''), format='%d%b%y') - + N = 100000 + self.series = Series(date_range(start='1/1/2000', periods=N, freq='T')) -class timeseries_year_apply(object): - goal_time = 0.2 + def time_dt_accessor(self): + self.series.dt - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_year_apply(self): - self.year.apply(self.date) - - -class timeseries_year_incr(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - if hasattr(Series, 'convert'): - Series.resample = Series.convert - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_year_incr(self): - (self.date + self.year) \ No newline at end of file + def time_dt_accessor_normalize(self): + self.series.dt.normalize() diff --git a/asv_bench/benchmarks/timestamp.py b/asv_bench/benchmarks/timestamp.py new file mode 100644 index 0000000000000..c142a9b59fc43 --- /dev/null +++ b/asv_bench/benchmarks/timestamp.py @@ -0,0 +1,119 @@ +import datetime + +from pandas import Timestamp +import pytz + + +class TimestampConstruction(object): + + def time_parse_iso8601_no_tz(self): + Timestamp('2017-08-25 08:16:14') + + def time_parse_iso8601_tz(self): + Timestamp('2017-08-25 08:16:14-0500') + + def time_parse_dateutil(self): + Timestamp('2017/08/25 08:16:14 AM') + + def time_parse_today(self): + Timestamp('today') + + def time_parse_now(self): + Timestamp('now') + + def time_fromordinal(self): + Timestamp.fromordinal(730120) + + def time_fromtimestamp(self): + Timestamp.fromtimestamp(1515448538) + + +class TimestampProperties(object): + goal_time = 0.2 + + _tzs = [None, pytz.timezone('Europe/Amsterdam')] + _freqs = [None, 'B'] + params = [_tzs, _freqs] + param_names = ['tz', 'freq'] + + def setup(self, tz, freq): + self.ts = Timestamp('2017-08-25 08:16:14', tzinfo=tz, freq=freq) + + 
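The `TimestampProperties` methods that follow time bare attribute access on the `Timestamp` built in `setup` above. For orientation, a sketch of what those attributes return for that fixed date (assuming the tz=None, freq=None combination):

    from pandas import Timestamp

    ts = Timestamp('2017-08-25 08:16:14')
    ts.dayofweek       # 4 -- Friday (Monday == 0)
    ts.quarter         # 3 -- August falls in Q3
    ts.days_in_month   # 31
    ts.is_month_start  # False -- the 25th, not the 1st
    ts.is_leap_year    # False -- 2017 is not a leap year
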
 def time_tz(self, tz, freq): + self.ts.tz + + def time_dayofweek(self, tz, freq): + self.ts.dayofweek + + def time_weekday_name(self, tz, freq): + self.ts.weekday_name + + def time_dayofyear(self, tz, freq): + self.ts.dayofyear + + def time_week(self, tz, freq): + self.ts.week + + def time_quarter(self, tz, freq): + self.ts.quarter + + def time_days_in_month(self, tz, freq): + self.ts.days_in_month + + def time_freqstr(self, tz, freq): + self.ts.freqstr + + def time_is_month_start(self, tz, freq): + self.ts.is_month_start + + def time_is_month_end(self, tz, freq): + self.ts.is_month_end + + def time_is_quarter_start(self, tz, freq): + self.ts.is_quarter_start + + def time_is_quarter_end(self, tz, freq): + self.ts.is_quarter_end + + def time_is_year_start(self, tz, freq): + self.ts.is_year_start + + def time_is_year_end(self, tz, freq): + self.ts.is_year_end + + def time_is_leap_year(self, tz, freq): + self.ts.is_leap_year + + def time_microsecond(self, tz, freq): + self.ts.microsecond + + +class TimestampOps(object): + goal_time = 0.2 + + params = [None, 'US/Eastern'] + param_names = ['tz'] + + def setup(self, tz): + self.ts = Timestamp('2017-08-25 08:16:14', tz=tz) + + def time_replace_tz(self, tz): + self.ts.replace(tzinfo=pytz.timezone('US/Eastern')) + + def time_replace_None(self, tz): + self.ts.replace(tzinfo=None) + + def time_to_pydatetime(self, tz): + self.ts.to_pydatetime() + + +class TimestampAcrossDst(object): + goal_time = 0.2 + + def setup(self): + dt = datetime.datetime(2016, 3, 27, 1) + self.tzinfo = pytz.timezone('CET').localize(dt, is_dst=False).tzinfo + self.ts2 = Timestamp(dt) + + def time_replace_across_dst(self): + self.ts2.replace(tzinfo=self.tzinfo) diff --git a/asv_bench/vbench_to_asv.py b/asv_bench/vbench_to_asv.py index c3041ec2b1ba1..b1179387e65d5 100644 --- a/asv_bench/vbench_to_asv.py +++ b/asv_bench/vbench_to_asv.py @@ -69,7 +69,7 @@ def visit_ClassDef(self, node): return node def visit_TryExcept(self, node): - if any([isinstance(x, (ast.Import, ast.ImportFrom)) for x in node.body]): + if any(isinstance(x, (ast.Import, ast.ImportFrom)) for x in node.body): self.imports.append(node) else: self.generic_visit(node) @@ -114,7 +114,7 @@ def translate_module(target_module): l_vars = {} exec('import ' + target_module) in g_vars - print target_module + print(target_module) module = eval(target_module, g_vars) benchmarks = [] @@ -157,7 +157,7 @@ def translate_module(target_module): mod = os.path.basename(module) if mod in ['make.py', 'measure_memory_consumption.py', 'perf_HEAD.py', 'run_suite.py', 'test_perf.py', 'generate_rst_files.py', 'test.py', 'suite.py']: continue - print - print mod + print('') + print(mod) translate_module(mod.replace('.py', '')) diff --git a/bench/alignment.py b/bench/alignment.py deleted file mode 100644 index bc3134f597ee0..0000000000000 --- a/bench/alignment.py +++ /dev/null @@ -1,22 +0,0 @@ -# Setup -from pandas.compat import range, lrange -import numpy as np -import pandas -import la -N = 1000 -K = 50 -arr1 = np.random.randn(N, K) -arr2 = np.random.randn(N, K) -idx1 = lrange(N) -idx2 = lrange(K) - -# pandas -dma1 = pandas.DataFrame(arr1, idx1, idx2) -dma2 = pandas.DataFrame(arr2, idx1[::-1], idx2[::-1]) - -# larry -lar1 = la.larry(arr1, [idx1, idx2]) -lar2 = la.larry(arr2, [idx1[::-1], idx2[::-1]]) - -for i in range(100): - result = lar1 + lar2 diff --git a/bench/bench_dense_to_sparse.py b/bench/bench_dense_to_sparse.py deleted file mode 100644 index e1dcd3456e88d..0000000000000 --- a/bench/bench_dense_to_sparse.py +++ /dev/null @@ 
-1,14 +0,0 @@ -from pandas import * - -K = 100 -N = 100000 -rng = DatetimeIndex('1/1/2000', periods=N, offset=datetools.Minute()) - -rng2 = np.asarray(rng).astype('M8[us]').astype('i8') - -series = {} -for i in range(1, K + 1): - data = np.random.randn(N)[:-i] - this_rng = rng2[:-i] - data[100:] = np.nan - series[i] = SparseSeries(data, index=this_rng) diff --git a/bench/bench_get_put_value.py b/bench/bench_get_put_value.py deleted file mode 100644 index 427e0b1b10a22..0000000000000 --- a/bench/bench_get_put_value.py +++ /dev/null @@ -1,56 +0,0 @@ -from pandas import * -from pandas.util.testing import rands -from pandas.compat import range - -N = 1000 -K = 50 - - -def _random_index(howmany): - return Index([rands(10) for _ in range(howmany)]) - -df = DataFrame(np.random.randn(N, K), index=_random_index(N), - columns=_random_index(K)) - - -def get1(): - for col in df.columns: - for row in df.index: - _ = df[col][row] - - -def get2(): - for col in df.columns: - for row in df.index: - _ = df.get_value(row, col) - - -def put1(): - for col in df.columns: - for row in df.index: - df[col][row] = 0 - - -def put2(): - for col in df.columns: - for row in df.index: - df.set_value(row, col, 0) - - -def resize1(): - buf = DataFrame() - for col in df.columns: - for row in df.index: - buf = buf.set_value(row, col, 5.) - return buf - - -def resize2(): - from collections import defaultdict - - buf = defaultdict(dict) - for col in df.columns: - for row in df.index: - buf[col][row] = 5. - - return DataFrame(buf) diff --git a/bench/bench_groupby.py b/bench/bench_groupby.py deleted file mode 100644 index d7a2853e1e7b2..0000000000000 --- a/bench/bench_groupby.py +++ /dev/null @@ -1,66 +0,0 @@ -from pandas import * -from pandas.util.testing import rands -from pandas.compat import range - -import string -import random - -k = 20000 -n = 10 - -foo = np.tile(np.array([rands(10) for _ in range(k)], dtype='O'), n) -foo2 = list(foo) -random.shuffle(foo) -random.shuffle(foo2) - -df = DataFrame({'A': foo, - 'B': foo2, - 'C': np.random.randn(n * k)}) - -import pandas._sandbox as sbx - - -def f(): - table = sbx.StringHashTable(len(df)) - ret = table.factorize(df['A']) - return ret - - -def g(): - table = sbx.PyObjectHashTable(len(df)) - ret = table.factorize(df['A']) - return ret - -ret = f() - -""" -import pandas._tseries as lib - -f = np.std - - -grouped = df.groupby(['A', 'B']) - -label_list = [ping.labels for ping in grouped.groupings] -shape = [len(ping.ids) for ping in grouped.groupings] - -from pandas.core.groupby import get_group_index - - -group_index = get_group_index(label_list, shape, - sort=True, xnull=True).astype('i4') - -ngroups = np.prod(shape) - -indexer = lib.groupsort_indexer(group_index, ngroups) - -values = df['C'].values.take(indexer) -group_index = group_index.take(indexer) - -f = lambda x: x.std(ddof=1) - -grouper = lib.Grouper(df['C'], np.ndarray.std, group_index, ngroups) -result = grouper.get_result() - -expected = grouped.std() -""" diff --git a/bench/bench_join_panel.py b/bench/bench_join_panel.py deleted file mode 100644 index f3c3f8ba15f70..0000000000000 --- a/bench/bench_join_panel.py +++ /dev/null @@ -1,85 +0,0 @@ -# reasonably efficient - - -def create_panels_append(cls, panels): - """ return an append list of panels """ - panels = [a for a in panels if a is not None] - # corner cases - if len(panels) == 0: - return None - elif len(panels) == 1: - return panels[0] - elif len(panels) == 2 and panels[0] == panels[1]: - return panels[0] - # import pdb; pdb.set_trace() - # create a joint 
index for the axis - - def joint_index_for_axis(panels, axis): - s = set() - for p in panels: - s.update(list(getattr(p, axis))) - return sorted(list(s)) - - def reindex_on_axis(panels, axis, axis_reindex): - new_axis = joint_index_for_axis(panels, axis) - new_panels = [p.reindex(**{axis_reindex: new_axis, - 'copy': False}) for p in panels] - return new_panels, new_axis - # create the joint major index, dont' reindex the sub-panels - we are - # appending - major = joint_index_for_axis(panels, 'major_axis') - # reindex on minor axis - panels, minor = reindex_on_axis(panels, 'minor_axis', 'minor') - # reindex on items - panels, items = reindex_on_axis(panels, 'items', 'items') - # concatenate values - try: - values = np.concatenate([p.values for p in panels], axis=1) - except Exception as detail: - raise Exception("cannot append values that dont' match dimensions! -> [%s] %s" - % (','.join(["%s" % p for p in panels]), str(detail))) - # pm('append - create_panel') - p = Panel(values, items=items, major_axis=major, - minor_axis=minor) - # pm('append - done') - return p - - -# does the job but inefficient (better to handle like you read a table in -# pytables...e.g create a LongPanel then convert to Wide) -def create_panels_join(cls, panels): - """ given an array of panels's, create a single panel """ - panels = [a for a in panels if a is not None] - # corner cases - if len(panels) == 0: - return None - elif len(panels) == 1: - return panels[0] - elif len(panels) == 2 and panels[0] == panels[1]: - return panels[0] - d = dict() - minor, major, items = set(), set(), set() - for panel in panels: - items.update(panel.items) - major.update(panel.major_axis) - minor.update(panel.minor_axis) - values = panel.values - for item, item_index in panel.items.indexMap.items(): - for minor_i, minor_index in panel.minor_axis.indexMap.items(): - for major_i, major_index in panel.major_axis.indexMap.items(): - try: - d[(minor_i, major_i, item)] = values[item_index, major_index, minor_index] - except: - pass - # stack the values - minor = sorted(list(minor)) - major = sorted(list(major)) - items = sorted(list(items)) - # create the 3d stack (items x columns x indicies) - data = np.dstack([np.asarray([np.asarray([d.get((minor_i, major_i, item), np.nan) - for item in items]) - for major_i in major]).transpose() - for minor_i in minor]) - # construct the panel - return Panel(data, items, major, minor) -add_class_method(Panel, create_panels_join, 'join_many') diff --git a/bench/bench_khash_dict.py b/bench/bench_khash_dict.py deleted file mode 100644 index 054fc36131b65..0000000000000 --- a/bench/bench_khash_dict.py +++ /dev/null @@ -1,89 +0,0 @@ -""" -Some comparisons of khash.h to Python dict -""" -from __future__ import print_function - -import numpy as np -import os - -from vbench.api import Benchmark -from pandas.util.testing import rands -from pandas.compat import range -import pandas._tseries as lib -import pandas._sandbox as sbx -import time - -import psutil - -pid = os.getpid() -proc = psutil.Process(pid) - - -def object_test_data(n): - pass - - -def string_test_data(n): - return np.array([rands(10) for _ in range(n)], dtype='O') - - -def int_test_data(n): - return np.arange(n, dtype='i8') - -N = 1000000 - -#---------------------------------------------------------------------- -# Benchmark 1: map_locations - - -def map_locations_python_object(): - arr = string_test_data(N) - return _timeit(lambda: lib.map_indices_object(arr)) - - -def map_locations_khash_object(): - arr = string_test_data(N) - - def f(): - 
table = sbx.PyObjectHashTable(len(arr)) - table.map_locations(arr) - return _timeit(f) - - -def _timeit(f, iterations=10): - start = time.time() - for _ in range(iterations): - foo = f() - elapsed = time.time() - start - return elapsed - -#---------------------------------------------------------------------- -# Benchmark 2: lookup_locations - - -def lookup_python(values): - table = lib.map_indices_object(values) - return _timeit(lambda: lib.merge_indexer_object(values, table)) - - -def lookup_khash(values): - table = sbx.PyObjectHashTable(len(values)) - table.map_locations(values) - locs = table.lookup_locations(values) - # elapsed = _timeit(lambda: table.lookup_locations2(values)) - return table - - -def leak(values): - for _ in range(100): - print(proc.get_memory_info()) - table = lookup_khash(values) - # table.destroy() - -arr = string_test_data(N) - -#---------------------------------------------------------------------- -# Benchmark 3: unique - -#---------------------------------------------------------------------- -# Benchmark 4: factorize diff --git a/bench/bench_merge.R b/bench/bench_merge.R deleted file mode 100644 index 3ed4618494857..0000000000000 --- a/bench/bench_merge.R +++ /dev/null @@ -1,161 +0,0 @@ -library(plyr) -library(data.table) -N <- 10000 -indices = rep(NA, N) -indices2 = rep(NA, N) -for (i in 1:N) { - indices[i] <- paste(sample(letters, 10), collapse="") - indices2[i] <- paste(sample(letters, 10), collapse="") -} -left <- data.frame(key=rep(indices[1:8000], 10), - key2=rep(indices2[1:8000], 10), - value=rnorm(80000)) -right <- data.frame(key=indices[2001:10000], - key2=indices2[2001:10000], - value2=rnorm(8000)) - -right2 <- data.frame(key=rep(right$key, 2), - key2=rep(right$key2, 2), - value2=rnorm(16000)) - -left.dt <- data.table(left, key=c("key", "key2")) -right.dt <- data.table(right, key=c("key", "key2")) -right2.dt <- data.table(right2, key=c("key", "key2")) - -# left.dt2 <- data.table(left) -# right.dt2 <- data.table(right) - -## left <- data.frame(key=rep(indices[1:1000], 10), -## key2=rep(indices2[1:1000], 10), -## value=rnorm(100000)) -## right <- data.frame(key=indices[1:1000], -## key2=indices2[1:1000], -## value2=rnorm(10000)) - -timeit <- function(func, niter=10) { - timing = rep(NA, niter) - for (i in 1:niter) { - gc() - timing[i] <- system.time(func())[3] - } - mean(timing) -} - -left.join <- function(sort=FALSE) { - result <- base::merge(left, right, all.x=TRUE, sort=sort) -} - -right.join <- function(sort=FALSE) { - result <- base::merge(left, right, all.y=TRUE, sort=sort) -} - -outer.join <- function(sort=FALSE) { - result <- base::merge(left, right, all=TRUE, sort=sort) -} - -inner.join <- function(sort=FALSE) { - result <- base::merge(left, right, all=FALSE, sort=sort) -} - -left.join.dt <- function(sort=FALSE) { - result <- right.dt[left.dt] -} - -right.join.dt <- function(sort=FALSE) { - result <- left.dt[right.dt] -} - -outer.join.dt <- function(sort=FALSE) { - result <- merge(left.dt, right.dt, all=TRUE, sort=sort) -} - -inner.join.dt <- function(sort=FALSE) { - result <- merge(left.dt, right.dt, all=FALSE, sort=sort) -} - -plyr.join <- function(type) { - result <- plyr::join(left, right, by=c("key", "key2"), - type=type, match="first") -} - -sort.options <- c(FALSE, TRUE) - -# many-to-one - -results <- matrix(nrow=4, ncol=3) -colnames(results) <- c("base::merge", "plyr", "data.table") -rownames(results) <- c("inner", "outer", "left", "right") - -base.functions <- c(inner.join, outer.join, left.join, right.join) -plyr.functions <- 
c(function() plyr.join("inner"), - function() plyr.join("full"), - function() plyr.join("left"), - function() plyr.join("right")) -dt.functions <- c(inner.join.dt, outer.join.dt, left.join.dt, right.join.dt) -for (i in 1:4) { - base.func <- base.functions[[i]] - plyr.func <- plyr.functions[[i]] - dt.func <- dt.functions[[i]] - results[i, 1] <- timeit(base.func) - results[i, 2] <- timeit(plyr.func) - results[i, 3] <- timeit(dt.func) -} - - -# many-to-many - -left.join <- function(sort=FALSE) { - result <- base::merge(left, right2, all.x=TRUE, sort=sort) -} - -right.join <- function(sort=FALSE) { - result <- base::merge(left, right2, all.y=TRUE, sort=sort) -} - -outer.join <- function(sort=FALSE) { - result <- base::merge(left, right2, all=TRUE, sort=sort) -} - -inner.join <- function(sort=FALSE) { - result <- base::merge(left, right2, all=FALSE, sort=sort) -} - -left.join.dt <- function(sort=FALSE) { - result <- right2.dt[left.dt] -} - -right.join.dt <- function(sort=FALSE) { - result <- left.dt[right2.dt] -} - -outer.join.dt <- function(sort=FALSE) { - result <- merge(left.dt, right2.dt, all=TRUE, sort=sort) -} - -inner.join.dt <- function(sort=FALSE) { - result <- merge(left.dt, right2.dt, all=FALSE, sort=sort) -} - -sort.options <- c(FALSE, TRUE) - -# many-to-one - -results <- matrix(nrow=4, ncol=3) -colnames(results) <- c("base::merge", "plyr", "data.table") -rownames(results) <- c("inner", "outer", "left", "right") - -base.functions <- c(inner.join, outer.join, left.join, right.join) -plyr.functions <- c(function() plyr.join("inner"), - function() plyr.join("full"), - function() plyr.join("left"), - function() plyr.join("right")) -dt.functions <- c(inner.join.dt, outer.join.dt, left.join.dt, right.join.dt) -for (i in 1:4) { - base.func <- base.functions[[i]] - plyr.func <- plyr.functions[[i]] - dt.func <- dt.functions[[i]] - results[i, 1] <- timeit(base.func) - results[i, 2] <- timeit(plyr.func) - results[i, 3] <- timeit(dt.func) -} - diff --git a/bench/bench_merge.py b/bench/bench_merge.py deleted file mode 100644 index 330dba7b9af69..0000000000000 --- a/bench/bench_merge.py +++ /dev/null @@ -1,105 +0,0 @@ -import random -import gc -import time -from pandas import * -from pandas.compat import range, lrange, StringIO -from pandas.util.testing import rands - -N = 10000 -ngroups = 10 - - -def get_test_data(ngroups=100, n=N): - unique_groups = lrange(ngroups) - arr = np.asarray(np.tile(unique_groups, n / ngroups), dtype=object) - - if len(arr) < n: - arr = np.asarray(list(arr) + unique_groups[:n - len(arr)], - dtype=object) - - random.shuffle(arr) - return arr - -# aggregate multiple columns -# df = DataFrame({'key1' : get_test_data(ngroups=ngroups), -# 'key2' : get_test_data(ngroups=ngroups), -# 'data1' : np.random.randn(N), -# 'data2' : np.random.randn(N)}) - -# df2 = DataFrame({'key1' : get_test_data(ngroups=ngroups, n=N//10), -# 'key2' : get_test_data(ngroups=ngroups//2, n=N//10), -# 'value' : np.random.randn(N // 10)}) -# result = merge.merge(df, df2, on='key2') - -N = 10000 - -indices = np.array([rands(10) for _ in range(N)], dtype='O') -indices2 = np.array([rands(10) for _ in range(N)], dtype='O') -key = np.tile(indices[:8000], 10) -key2 = np.tile(indices2[:8000], 10) - -left = DataFrame({'key': key, 'key2': key2, - 'value': np.random.randn(80000)}) -right = DataFrame({'key': indices[2000:], 'key2': indices2[2000:], - 'value2': np.random.randn(8000)}) - -right2 = right.append(right, ignore_index=True) - - -join_methods = ['inner', 'outer', 'left', 'right'] -results = 
DataFrame(index=join_methods, columns=[False, True]) -niter = 10 -for sort in [False, True]: - for join_method in join_methods: - f = lambda: merge(left, right, how=join_method, sort=sort) - gc.disable() - start = time.time() - for _ in range(niter): - f() - elapsed = (time.time() - start) / niter - gc.enable() - results[sort][join_method] = elapsed -# results.columns = ['pandas'] -results.columns = ['dont_sort', 'sort'] - - -# R results -# many to one -r_results = read_table(StringIO(""" base::merge plyr data.table -inner 0.2475 0.1183 0.1100 -outer 0.4213 0.1916 0.2090 -left 0.2998 0.1188 0.0572 -right 0.3102 0.0536 0.0376 -"""), sep='\s+') - -presults = results[['dont_sort']].rename(columns={'dont_sort': 'pandas'}) -all_results = presults.join(r_results) - -all_results = all_results.div(all_results['pandas'], axis=0) - -all_results = all_results.ix[:, ['pandas', 'data.table', 'plyr', - 'base::merge']] - -sort_results = DataFrame.from_items([('pandas', results['sort']), - ('R', r_results['base::merge'])]) -sort_results['Ratio'] = sort_results['R'] / sort_results['pandas'] - - -nosort_results = DataFrame.from_items([('pandas', results['dont_sort']), - ('R', r_results['base::merge'])]) -nosort_results['Ratio'] = nosort_results['R'] / nosort_results['pandas'] - -# many to many - -# many to one -r_results = read_table(StringIO("""base::merge plyr data.table -inner 0.4610 0.1276 0.1269 -outer 0.9195 0.1881 0.2725 -left 0.6559 0.1257 0.0678 -right 0.6425 0.0522 0.0428 -"""), sep='\s+') - -all_results = presults.join(r_results) -all_results = all_results.div(all_results['pandas'], axis=0) -all_results = all_results.ix[:, ['pandas', 'data.table', 'plyr', - 'base::merge']] diff --git a/bench/bench_merge_sqlite.py b/bench/bench_merge_sqlite.py deleted file mode 100644 index 3ad4b810119c3..0000000000000 --- a/bench/bench_merge_sqlite.py +++ /dev/null @@ -1,87 +0,0 @@ -import numpy as np -from collections import defaultdict -import gc -import time -from pandas import DataFrame -from pandas.util.testing import rands -from pandas.compat import range, zip -import random - -N = 10000 - -indices = np.array([rands(10) for _ in range(N)], dtype='O') -indices2 = np.array([rands(10) for _ in range(N)], dtype='O') -key = np.tile(indices[:8000], 10) -key2 = np.tile(indices2[:8000], 10) - -left = DataFrame({'key': key, 'key2': key2, - 'value': np.random.randn(80000)}) -right = DataFrame({'key': indices[2000:], 'key2': indices2[2000:], - 'value2': np.random.randn(8000)}) - -# right2 = right.append(right, ignore_index=True) -# right = right2 - -# random.shuffle(key2) -# indices2 = indices.copy() -# random.shuffle(indices2) - -# Prepare Database -import sqlite3 -create_sql_indexes = True - -conn = sqlite3.connect(':memory:') -conn.execute( - 'create table left( key varchar(10), key2 varchar(10), value int);') -conn.execute( - 'create table right( key varchar(10), key2 varchar(10), value2 int);') -conn.executemany('insert into left values (?, ?, ?)', - zip(key, key2, left['value'])) -conn.executemany('insert into right values (?, ?, ?)', - zip(right['key'], right['key2'], right['value2'])) - -# Create Indices -if create_sql_indexes: - conn.execute('create index left_ix on left(key, key2)') - conn.execute('create index right_ix on right(key, key2)') - - -join_methods = ['inner', 'left outer', 'left'] # others not supported -sql_results = DataFrame(index=join_methods, columns=[False]) -niter = 5 -for sort in [False]: - for join_method in join_methods: - sql = """CREATE TABLE test as select * - from left - %s join 
right - on left.key=right.key - and left.key2 = right.key2;""" % join_method - sql = """select * - from left - %s join right - on left.key=right.key - and left.key2 = right.key2;""" % join_method - - if sort: - sql = '%s order by key, key2' % sql - f = lambda: list(conn.execute(sql)) # list fetches results - g = lambda: conn.execute(sql) # list fetches results - gc.disable() - start = time.time() - # for _ in range(niter): - g() - elapsed = (time.time() - start) / niter - gc.enable() - - cur = conn.execute("DROP TABLE test") - conn.commit() - - sql_results[sort][join_method] = elapsed - sql_results.columns = ['sqlite3'] # ['dont_sort', 'sort'] - sql_results.index = ['inner', 'outer', 'left'] - - sql = """select * - from left - inner join right - on left.key=right.key - and left.key2 = right.key2;""" diff --git a/bench/bench_pivot.R b/bench/bench_pivot.R deleted file mode 100644 index 06dc6a105bc43..0000000000000 --- a/bench/bench_pivot.R +++ /dev/null @@ -1,27 +0,0 @@ -library(reshape2) - - -n <- 100000 -a.size <- 5 -b.size <- 5 - -data <- data.frame(a=sample(letters[1:a.size], n, replace=T), - b=sample(letters[1:b.size], n, replace=T), - c=rnorm(n), - d=rnorm(n)) - -timings <- numeric() - -# acast(melt(data, id=c("a", "b")), a ~ b, mean) -# acast(melt(data, id=c("a", "b")), a + b ~ variable, mean) - -for (i in 1:10) { - gc() - tim <- system.time(acast(melt(data, id=c("a", "b")), a ~ b, mean, - subset=.(variable=="c"))) - timings[i] = tim[3] -} - -mean(timings) - -acast(melt(data, id=c("a", "b")), a ~ b, mean, subset=.(variable="c")) diff --git a/bench/bench_pivot.py b/bench/bench_pivot.py deleted file mode 100644 index 007bd0aaebc2f..0000000000000 --- a/bench/bench_pivot.py +++ /dev/null @@ -1,16 +0,0 @@ -from pandas import * -import string - - -n = 100000 -asize = 5 -bsize = 5 - -letters = np.asarray(list(string.letters), dtype=object) - -data = DataFrame(dict(foo=letters[:asize][np.random.randint(0, asize, n)], - bar=letters[:bsize][np.random.randint(0, bsize, n)], - baz=np.random.randn(n), - qux=np.random.randn(n))) - -table = pivot_table(data, xby=['foo', 'bar']) diff --git a/bench/bench_sparse.py b/bench/bench_sparse.py deleted file mode 100644 index 0aa705118d970..0000000000000 --- a/bench/bench_sparse.py +++ /dev/null @@ -1,92 +0,0 @@ -import numpy as np - -from pandas import * -import pandas.core.sparse as spm -import pandas.compat as compat -reload(spm) -from pandas.core.sparse import * - -N = 10000. 
- -arr1 = np.arange(N) -index = Index(np.arange(N)) - -off = N // 10 -arr1[off: 2 * off] = np.NaN -arr1[4 * off: 5 * off] = np.NaN -arr1[8 * off: 9 * off] = np.NaN - -arr2 = np.arange(N) -arr2[3 * off // 2: 2 * off + off // 2] = np.NaN -arr2[8 * off + off // 2: 9 * off + off // 2] = np.NaN - -s1 = SparseSeries(arr1, index=index) -s2 = SparseSeries(arr2, index=index) - -is1 = SparseSeries(arr1, kind='integer', index=index) -is2 = SparseSeries(arr2, kind='integer', index=index) - -s1_dense = s1.to_dense() -s2_dense = s2.to_dense() - -if compat.is_platform_linux(): - pth = '/home/wesm/code/pandas/example' -else: - pth = '/Users/wesm/code/pandas/example' - -dm = DataFrame.load(pth) - -sdf = dm.to_sparse() - - -def new_data_like(sdf): - new_data = {} - for col, series in compat.iteritems(sdf): - new_data[col] = SparseSeries(np.random.randn(len(series.sp_values)), - index=sdf.index, - sparse_index=series.sp_index, - fill_value=series.fill_value) - - return SparseDataFrame(new_data) - -# data = {} -# for col, ser in dm.iteritems(): -# data[col] = SparseSeries(ser) - -dwp = Panel.fromDict({'foo': dm}) -# sdf = SparseDataFrame(data) - - -lp = stack_sparse_frame(sdf) - - -swp = SparsePanel({'A': sdf}) -swp = SparsePanel({'A': sdf, - 'B': sdf, - 'C': sdf, - 'D': sdf}) - -y = sdf -x = SparsePanel({'x1': sdf + new_data_like(sdf) / 10, - 'x2': sdf + new_data_like(sdf) / 10}) - -dense_y = sdf -dense_x = x.to_dense() - -# import hotshot, hotshot.stats -# prof = hotshot.Profile('test.prof') - -# benchtime, stones = prof.runcall(ols, y=y, x=x) - -# prof.close() - -# stats = hotshot.stats.load('test.prof') - -dense_model = ols(y=dense_y, x=dense_x) - -import pandas.stats.plm as plm -import pandas.stats.interface as face -reload(plm) -reload(face) - -# model = face.ols(y=y, x=x) diff --git a/bench/bench_take_indexing.py b/bench/bench_take_indexing.py deleted file mode 100644 index 5fb584bcfe45f..0000000000000 --- a/bench/bench_take_indexing.py +++ /dev/null @@ -1,55 +0,0 @@ -from __future__ import print_function -import numpy as np - -from pandas import * -import pandas._tseries as lib - -from pandas import DataFrame -import timeit -from pandas.compat import zip - -setup = """ -from pandas import Series -import pandas._tseries as lib -import random -import numpy as np - -import random -n = %d -k = %d -arr = np.random.randn(n, k) -indexer = np.arange(n, dtype=np.int32) -indexer = indexer[::-1] -""" - -sizes = [100, 1000, 10000, 100000] -iters = [1000, 1000, 100, 1] - -fancy_2d = [] -take_2d = [] -cython_2d = [] - -n = 1000 - - -def _timeit(stmt, size, k=5, iters=1000): - timer = timeit.Timer(stmt=stmt, setup=setup % (sz, k)) - return timer.timeit(n) / n - -for sz, its in zip(sizes, iters): - print(sz) - fancy_2d.append(_timeit('arr[indexer]', sz, iters=its)) - take_2d.append(_timeit('arr.take(indexer, axis=0)', sz, iters=its)) - cython_2d.append(_timeit('lib.take_axis0(arr, indexer)', sz, iters=its)) - -df = DataFrame({'fancy': fancy_2d, - 'take': take_2d, - 'cython': cython_2d}) - -print(df) - -from pandas.rpy.common import r -r('mat <- matrix(rnorm(50000), nrow=10000, ncol=5)') -r('set.seed(12345') -r('indexer <- sample(1:10000)') -r('mat[indexer,]') diff --git a/bench/bench_unique.py b/bench/bench_unique.py deleted file mode 100644 index 87bd2f2df586c..0000000000000 --- a/bench/bench_unique.py +++ /dev/null @@ -1,278 +0,0 @@ -from __future__ import print_function -from pandas import * -from pandas.util.testing import rands -from pandas.compat import range, zip -import pandas._tseries as lib -import numpy as 
np -import matplotlib.pyplot as plt - -N = 50000 -K = 10000 - -groups = np.array([rands(10) for _ in range(K)], dtype='O') -groups2 = np.array([rands(10) for _ in range(K)], dtype='O') - -labels = np.tile(groups, N // K) -labels2 = np.tile(groups2, N // K) -data = np.random.randn(N) - - -def timeit(f, niter): - import gc - import time - gc.disable() - start = time.time() - for _ in range(niter): - f() - elapsed = (time.time() - start) / niter - gc.enable() - return elapsed - - -def algo1(): - unique_labels = np.unique(labels) - result = np.empty(len(unique_labels)) - for i, label in enumerate(unique_labels): - result[i] = data[labels == label].sum() - - -def algo2(): - unique_labels = np.unique(labels) - indices = lib.groupby_indices(labels) - result = np.empty(len(unique_labels)) - - for i, label in enumerate(unique_labels): - result[i] = data.take(indices[label]).sum() - - -def algo3_nosort(): - rizer = lib.DictFactorizer() - labs, counts = rizer.factorize(labels, sort=False) - k = len(rizer.uniques) - out = np.empty(k) - lib.group_add(out, counts, data, labs) - - -def algo3_sort(): - rizer = lib.DictFactorizer() - labs, counts = rizer.factorize(labels, sort=True) - k = len(rizer.uniques) - out = np.empty(k) - lib.group_add(out, counts, data, labs) - -import numpy as np -import random - - -# dict to hold results -counts = {} - -# a hack to generate random key, value pairs. -# 5k keys, 100k values -x = np.tile(np.arange(5000, dtype='O'), 20) -random.shuffle(x) -xarr = x -x = [int(y) for y in x] -data = np.random.uniform(0, 1, 100000) - - -def f(): - # groupby sum - for k, v in zip(x, data): - try: - counts[k] += v - except KeyError: - counts[k] = v - - -def f2(): - rizer = lib.DictFactorizer() - labs, counts = rizer.factorize(xarr, sort=False) - k = len(rizer.uniques) - out = np.empty(k) - lib.group_add(out, counts, data, labs) - - -def algo4(): - rizer = lib.DictFactorizer() - labs1, _ = rizer.factorize(labels, sort=False) - k1 = len(rizer.uniques) - - rizer = lib.DictFactorizer() - labs2, _ = rizer.factorize(labels2, sort=False) - k2 = len(rizer.uniques) - - group_id = labs1 * k2 + labs2 - max_group = k1 * k2 - - if max_group > 1e6: - rizer = lib.Int64Factorizer(len(group_id)) - group_id, _ = rizer.factorize(group_id.astype('i8'), sort=True) - max_group = len(rizer.uniques) - - out = np.empty(max_group) - counts = np.zeros(max_group, dtype='i4') - lib.group_add(out, counts, data, group_id) - -# cumtime percall filename:lineno(function) -# 0.592 0.592 :1() - # 0.584 0.006 groupby_ex.py:37(algo3_nosort) - # 0.535 0.005 {method 'factorize' of DictFactorizer' objects} - # 0.047 0.000 {pandas._tseries.group_add} - # 0.002 0.000 numeric.py:65(zeros_like) - # 0.001 0.000 {method 'fill' of 'numpy.ndarray' objects} - # 0.000 0.000 {numpy.core.multiarray.empty_like} - # 0.000 0.000 {numpy.core.multiarray.empty} - -# UNIQUE timings - -# N = 10000000 -# K = 500000 - -# groups = np.array([rands(10) for _ in range(K)], dtype='O') - -# labels = np.tile(groups, N // K) -data = np.random.randn(N) - -data = np.random.randn(N) - -Ks = [100, 1000, 5000, 10000, 25000, 50000, 100000] - -# Ks = [500000, 1000000, 2500000, 5000000, 10000000] - -import psutil -import os -import gc - -pid = os.getpid() -proc = psutil.Process(pid) - - -def dict_unique(values, expected_K, sort=False, memory=False): - if memory: - gc.collect() - before_mem = proc.get_memory_info().rss - - rizer = lib.DictFactorizer() - result = rizer.unique_int64(values) - - if memory: - result = proc.get_memory_info().rss - before_mem - return 
result - - if sort: - result.sort() - assert(len(result) == expected_K) - return result - - -def khash_unique(values, expected_K, size_hint=False, sort=False, - memory=False): - if memory: - gc.collect() - before_mem = proc.get_memory_info().rss - - if size_hint: - rizer = lib.Factorizer(len(values)) - else: - rizer = lib.Factorizer(100) - - result = [] - result = rizer.unique(values) - - if memory: - result = proc.get_memory_info().rss - before_mem - return result - - if sort: - result.sort() - assert(len(result) == expected_K) - - -def khash_unique_str(values, expected_K, size_hint=False, sort=False, - memory=False): - if memory: - gc.collect() - before_mem = proc.get_memory_info().rss - - if size_hint: - rizer = lib.StringHashTable(len(values)) - else: - rizer = lib.StringHashTable(100) - - result = [] - result = rizer.unique(values) - - if memory: - result = proc.get_memory_info().rss - before_mem - return result - - if sort: - result.sort() - assert(len(result) == expected_K) - - -def khash_unique_int64(values, expected_K, size_hint=False, sort=False): - if size_hint: - rizer = lib.Int64HashTable(len(values)) - else: - rizer = lib.Int64HashTable(100) - - result = [] - result = rizer.unique(values) - - if sort: - result.sort() - assert(len(result) == expected_K) - - -def hash_bench(): - numpy = [] - dict_based = [] - dict_based_sort = [] - khash_hint = [] - khash_nohint = [] - for K in Ks: - print(K) - # groups = np.array([rands(10) for _ in range(K)]) - # labels = np.tile(groups, N // K).astype('O') - - groups = np.random.randint(0, long(100000000000), size=K) - labels = np.tile(groups, N // K) - dict_based.append(timeit(lambda: dict_unique(labels, K), 20)) - khash_nohint.append(timeit(lambda: khash_unique_int64(labels, K), 20)) - khash_hint.append(timeit(lambda: khash_unique_int64(labels, K, - size_hint=True), 20)) - - # memory, hard to get - # dict_based.append(np.mean([dict_unique(labels, K, memory=True) - # for _ in range(10)])) - # khash_nohint.append(np.mean([khash_unique(labels, K, memory=True) - # for _ in range(10)])) - # khash_hint.append(np.mean([khash_unique(labels, K, size_hint=True, memory=True) - # for _ in range(10)])) - - # dict_based_sort.append(timeit(lambda: dict_unique(labels, K, - # sort=True), 10)) - # numpy.append(timeit(lambda: np.unique(labels), 10)) - - # unique_timings = DataFrame({'numpy.unique' : numpy, - # 'dict, no sort' : dict_based, - # 'dict, sort' : dict_based_sort}, - # columns=['dict, no sort', - # 'dict, sort', 'numpy.unique'], - # index=Ks) - - unique_timings = DataFrame({'dict': dict_based, - 'khash, preallocate': khash_hint, - 'khash': khash_nohint}, - columns=['khash, preallocate', 'khash', 'dict'], - index=Ks) - - unique_timings.plot(kind='bar', legend=False) - plt.legend(loc='best') - plt.title('Unique on 100,000 values, int64') - plt.xlabel('Number of unique labels') - plt.ylabel('Mean execution time') - - plt.show() diff --git a/bench/bench_with_subset.R b/bench/bench_with_subset.R deleted file mode 100644 index 69d0f7a9eec63..0000000000000 --- a/bench/bench_with_subset.R +++ /dev/null @@ -1,53 +0,0 @@ -library(microbenchmark) -library(data.table) - - -data.frame.subset.bench <- function (n=1e7, times=30) { - df <- data.frame(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - print(microbenchmark(subset(df, a <= b & b <= (c ^ 2 + b ^ 2 - a) & b > c), - times=times)) -} - - -# data.table allows something very similar to query with an expression -# but we have chained comparisons AND we're faster BOO YAH! 
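The chained comparison the comment above refers to is what `DataFrame.query` accepts directly; the deleted Python counterpart (`bench/bench_with_subset.py`, further below) timed exactly this expression. A small illustration with made-up data:

    import numpy as np
    import pandas as pd

    df = pd.DataFrame(np.random.randn(10, 3), columns=list('abc'))
    # a <= b <= ... is a single chained comparison inside the query string
    subset = df.query('a <= b <= c ** 2 + b ** 2 - a and b > c')
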
-data.table.subset.expression.bench <- function (n=1e7, times=30) { - dt <- data.table(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - print(microbenchmark(dt[, a <= b & b <= (c ^ 2 + b ^ 2 - a) & b > c], - times=times)) -} - - -# compare against subset with data.table for good measure -data.table.subset.bench <- function (n=1e7, times=30) { - dt <- data.table(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - print(microbenchmark(subset(dt, a <= b & b <= (c ^ 2 + b ^ 2 - a) & b > c), - times=times)) -} - - -data.frame.with.bench <- function (n=1e7, times=30) { - df <- data.frame(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - - print(microbenchmark(with(df, a + b * (c ^ 2 + b ^ 2 - a) / (a * c) ^ 3), - times=times)) -} - - -data.table.with.bench <- function (n=1e7, times=30) { - dt <- data.table(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - print(microbenchmark(with(dt, a + b * (c ^ 2 + b ^ 2 - a) / (a * c) ^ 3), - times=times)) -} - - -bench <- function () { - data.frame.subset.bench() - data.table.subset.expression.bench() - data.table.subset.bench() - data.frame.with.bench() - data.table.with.bench() -} - - -bench() diff --git a/bench/bench_with_subset.py b/bench/bench_with_subset.py deleted file mode 100644 index 017401df3f7f3..0000000000000 --- a/bench/bench_with_subset.py +++ /dev/null @@ -1,116 +0,0 @@ -#!/usr/bin/env python - -""" -Microbenchmarks for comparison with R's "with" and "subset" functions -""" - -from __future__ import print_function -import numpy as np -from numpy import array -from timeit import repeat as timeit -from pandas.compat import range, zip -from pandas import DataFrame - - -setup_common = """from pandas import DataFrame -from numpy.random import randn -df = DataFrame(randn(%d, 3), columns=list('abc')) -%s""" - - -setup_with = "s = 'a + b * (c ** 2 + b ** 2 - a) / (a * c) ** 3'" - - -def bench_with(n, times=10, repeat=3, engine='numexpr'): - return np.array(timeit('df.eval(s, engine=%r)' % engine, - setup=setup_common % (n, setup_with), - repeat=repeat, number=times)) / times - - -setup_subset = "s = 'a <= b <= c ** 2 + b ** 2 - a and b > c'" - - -def bench_subset(n, times=10, repeat=3, engine='numexpr'): - return np.array(timeit('df.query(s, engine=%r)' % engine, - setup=setup_common % (n, setup_subset), - repeat=repeat, number=times)) / times - - -def bench(mn=1, mx=7, num=100, engines=('python', 'numexpr'), verbose=False): - r = np.logspace(mn, mx, num=num).round().astype(int) - - ev = DataFrame(np.empty((num, len(engines))), columns=engines) - qu = ev.copy(deep=True) - - ev['size'] = qu['size'] = r - - for engine in engines: - for i, n in enumerate(r): - if verbose: - print('engine: %r, i == %d' % (engine, i)) - ev.loc[i, engine] = bench_with(n, times=1, repeat=1, engine=engine) - qu.loc[i, engine] = bench_subset(n, times=1, repeat=1, - engine=engine) - - return ev, qu - - -def plot_perf(df, engines, title, filename=None): - from matplotlib.pyplot import figure, rc - - try: - from mpltools import style - except ImportError: - pass - else: - style.use('ggplot') - - rc('text', usetex=True) - - fig = figure(figsize=(4, 3), dpi=100) - ax = fig.add_subplot(111) - - for engine in engines: - ax.plot(df.size, df[engine], label=engine, lw=2) - - ax.set_xlabel('Number of Rows') - ax.set_ylabel('Time (s)') - ax.set_title(title) - ax.legend(loc='best') - ax.tick_params(top=False, right=False) - - fig.tight_layout() - - if filename is not None: - fig.savefig(filename) - - -if __name__ == '__main__': - import os - import pandas as pd - - pandas_dir = 
os.path.dirname(os.path.abspath(os.path.dirname(__file__))) - static_path = os.path.join(pandas_dir, 'doc', 'source', '_static') - - join = lambda p: os.path.join(static_path, p) - - fn = join('eval-query-perf-data.h5') - - engines = 'python', 'numexpr' - - if not os.path.exists(fn): - ev, qu = bench(verbose=True) - ev.to_hdf(fn, 'eval') - qu.to_hdf(fn, 'query') - else: - ev = pd.read_hdf(fn, 'eval') - qu = pd.read_hdf(fn, 'query') - - plot_perf(ev, engines, 'DataFrame.eval()', filename=join('eval-perf.png')) - plot_perf(qu, engines, 'DataFrame.query()', - filename=join('query-perf.png')) - - plot_perf(ev[ev.size <= 50000], engines, 'DataFrame.eval()', - filename=join('eval-perf-small.png')) - plot_perf(qu[qu.size <= 500000], engines, 'DataFrame.query()', - filename=join('query-perf-small.png')) diff --git a/bench/better_unique.py b/bench/better_unique.py deleted file mode 100644 index e03a4f433ce66..0000000000000 --- a/bench/better_unique.py +++ /dev/null @@ -1,80 +0,0 @@ -from __future__ import print_function -from pandas import DataFrame -from pandas.compat import range, zip -import timeit - -setup = """ -from pandas import Series -import pandas._tseries as _tseries -from pandas.compat import range -import random -import numpy as np - -def better_unique(values): - uniques = _tseries.fast_unique(values) - id_map = _tseries.map_indices_buf(uniques) - labels = _tseries.get_unique_labels(values, id_map) - return uniques, labels - -tot = 100000 - -def get_test_data(ngroups=100, n=tot): - unique_groups = range(ngroups) - random.shuffle(unique_groups) - arr = np.asarray(np.tile(unique_groups, n / ngroups), dtype=object) - - if len(arr) < n: - arr = np.asarray(list(arr) + unique_groups[:n - len(arr)], - dtype=object) - - return arr - -arr = get_test_data(ngroups=%d) -""" - -group_sizes = [10, 100, 1000, 10000, - 20000, 30000, 40000, - 50000, 60000, 70000, - 80000, 90000, 100000] - -numbers = [100, 100, 50] + [10] * 10 - -numpy = [] -wes = [] - -for sz, n in zip(group_sizes, numbers): - # wes_timer = timeit.Timer(stmt='better_unique(arr)', - # setup=setup % sz) - wes_timer = timeit.Timer(stmt='_tseries.fast_unique(arr)', - setup=setup % sz) - - numpy_timer = timeit.Timer(stmt='np.unique(arr)', - setup=setup % sz) - - print(n) - numpy_result = numpy_timer.timeit(number=n) / n - wes_result = wes_timer.timeit(number=n) / n - - print('Groups: %d, NumPy: %s, Wes: %s' % (sz, numpy_result, wes_result)) - - wes.append(wes_result) - numpy.append(numpy_result) - -result = DataFrame({'wes': wes, 'numpy': numpy}, index=group_sizes) - - -def make_plot(numpy, wes): - pass - -# def get_test_data(ngroups=100, n=100000): -# unique_groups = range(ngroups) -# random.shuffle(unique_groups) -# arr = np.asarray(np.tile(unique_groups, n / ngroups), dtype=object) - -# if len(arr) < n: -# arr = np.asarray(list(arr) + unique_groups[:n - len(arr)], -# dtype=object) - -# return arr - -# arr = get_test_data(ngroups=1000) diff --git a/bench/duplicated.R b/bench/duplicated.R deleted file mode 100644 index eb2376df2932a..0000000000000 --- a/bench/duplicated.R +++ /dev/null @@ -1,22 +0,0 @@ -N <- 100000 - -k1 = rep(NA, N) -k2 = rep(NA, N) -for (i in 1:N){ - k1[i] <- paste(sample(letters, 1), collapse="") - k2[i] <- paste(sample(letters, 1), collapse="") -} -df <- data.frame(a=k1, b=k2, c=rep(1:100, N / 100)) -df2 <- data.frame(a=k1, b=k2) - -timings <- numeric() -timings2 <- numeric() -for (i in 1:50) { - gc() - timings[i] = system.time(deduped <- df[!duplicated(df),])[3] - gc() - timings2[i] = system.time(deduped <- 
df[!duplicated(df[,c("a", "b")]),])[3] -} - -mean(timings) -mean(timings2) diff --git a/bench/io_roundtrip.py b/bench/io_roundtrip.py deleted file mode 100644 index d87da0ec6321a..0000000000000 --- a/bench/io_roundtrip.py +++ /dev/null @@ -1,116 +0,0 @@ -from __future__ import print_function -import time -import os -import numpy as np - -import la -import pandas -from pandas.compat import range -from pandas import datetools, DatetimeIndex - - -def timeit(f, iterations): - start = time.clock() - - for i in range(iterations): - f() - - return time.clock() - start - - -def rountrip_archive(N, K=50, iterations=10): - # Create data - arr = np.random.randn(N, K) - # lar = la.larry(arr) - dma = pandas.DataFrame(arr, - DatetimeIndex('1/1/2000', periods=N, - offset=datetools.Minute())) - dma[201] = 'bar' - - # filenames - filename_numpy = '/Users/wesm/tmp/numpy.npz' - filename_larry = '/Users/wesm/tmp/archive.hdf5' - filename_pandas = '/Users/wesm/tmp/pandas_tmp' - - # Delete old files - try: - os.unlink(filename_numpy) - except: - pass - try: - os.unlink(filename_larry) - except: - pass - - try: - os.unlink(filename_pandas) - except: - pass - - # Time a round trip save and load - # numpy_f = lambda: numpy_roundtrip(filename_numpy, arr, arr) - # numpy_time = timeit(numpy_f, iterations) / iterations - - # larry_f = lambda: larry_roundtrip(filename_larry, lar, lar) - # larry_time = timeit(larry_f, iterations) / iterations - - pandas_f = lambda: pandas_roundtrip(filename_pandas, dma, dma) - pandas_time = timeit(pandas_f, iterations) / iterations - print('pandas (HDF5) %7.4f seconds' % pandas_time) - - pickle_f = lambda: pandas_roundtrip(filename_pandas, dma, dma) - pickle_time = timeit(pickle_f, iterations) / iterations - print('pandas (pickle) %7.4f seconds' % pickle_time) - - # print('Numpy (npz) %7.4f seconds' % numpy_time) - # print('larry (HDF5) %7.4f seconds' % larry_time) - - # Delete old files - try: - os.unlink(filename_numpy) - except: - pass - try: - os.unlink(filename_larry) - except: - pass - - try: - os.unlink(filename_pandas) - except: - pass - - -def numpy_roundtrip(filename, arr1, arr2): - np.savez(filename, arr1=arr1, arr2=arr2) - npz = np.load(filename) - arr1 = npz['arr1'] - arr2 = npz['arr2'] - - -def larry_roundtrip(filename, lar1, lar2): - io = la.IO(filename) - io['lar1'] = lar1 - io['lar2'] = lar2 - lar1 = io['lar1'] - lar2 = io['lar2'] - - -def pandas_roundtrip(filename, dma1, dma2): - # What's the best way to code this? 
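The round trip being timed here is plain dict-style access on an `HDFStore`. A minimal sketch of the same pattern with a top-level import and a hypothetical scratch filename (requires PyTables):

    import numpy as np
    import pandas as pd

    df = pd.DataFrame(np.random.randn(100, 3))
    with pd.HDFStore('scratch.h5') as store:
        store['df'] = df              # write
        roundtripped = store['df']    # read back
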
- from pandas.io.pytables import HDFStore - store = HDFStore(filename) - store['dma1'] = dma1 - store['dma2'] = dma2 - dma1 = store['dma1'] - dma2 = store['dma2'] - - -def pandas_roundtrip_pickle(filename, dma1, dma2): - dma1.save(filename) - dma1 = pandas.DataFrame.load(filename) - dma2.save(filename) - dma2 = pandas.DataFrame.load(filename) - -if __name__ == '__main__': - rountrip_archive(10000, K=200) diff --git a/bench/serialize.py b/bench/serialize.py deleted file mode 100644 index b0edd6a5752d2..0000000000000 --- a/bench/serialize.py +++ /dev/null @@ -1,89 +0,0 @@ -from __future__ import print_function -from pandas.compat import range, lrange -import time -import os -import numpy as np - -import la -import pandas - - -def timeit(f, iterations): - start = time.clock() - - for i in range(iterations): - f() - - return time.clock() - start - - -def roundtrip_archive(N, iterations=10): - - # Create data - arr = np.random.randn(N, N) - lar = la.larry(arr) - dma = pandas.DataFrame(arr, lrange(N), lrange(N)) - - # filenames - filename_numpy = '/Users/wesm/tmp/numpy.npz' - filename_larry = '/Users/wesm/tmp/archive.hdf5' - filename_pandas = '/Users/wesm/tmp/pandas_tmp' - - # Delete old files - try: - os.unlink(filename_numpy) - except: - pass - try: - os.unlink(filename_larry) - except: - pass - try: - os.unlink(filename_pandas) - except: - pass - - # Time a round trip save and load - numpy_f = lambda: numpy_roundtrip(filename_numpy, arr, arr) - numpy_time = timeit(numpy_f, iterations) / iterations - - larry_f = lambda: larry_roundtrip(filename_larry, lar, lar) - larry_time = timeit(larry_f, iterations) / iterations - - pandas_f = lambda: pandas_roundtrip(filename_pandas, dma, dma) - pandas_time = timeit(pandas_f, iterations) / iterations - - print('Numpy (npz) %7.4f seconds' % numpy_time) - print('larry (HDF5) %7.4f seconds' % larry_time) - print('pandas (HDF5) %7.4f seconds' % pandas_time) - - -def numpy_roundtrip(filename, arr1, arr2): - np.savez(filename, arr1=arr1, arr2=arr2) - npz = np.load(filename) - arr1 = npz['arr1'] - arr2 = npz['arr2'] - - -def larry_roundtrip(filename, lar1, lar2): - io = la.IO(filename) - io['lar1'] = lar1 - io['lar2'] = lar2 - lar1 = io['lar1'] - lar2 = io['lar2'] - - -def pandas_roundtrip(filename, dma1, dma2): - from pandas.io.pytables import HDFStore - store = HDFStore(filename) - store['dma1'] = dma1 - store['dma2'] = dma2 - dma1 = store['dma1'] - dma2 = store['dma2'] - - -def pandas_roundtrip_pickle(filename, dma1, dma2): - dma1.save(filename) - dma1 = pandas.DataFrame.load(filename) - dma2.save(filename) - dma2 = pandas.DataFrame.load(filename) diff --git a/bench/test.py b/bench/test.py deleted file mode 100644 index 2339deab313a1..0000000000000 --- a/bench/test.py +++ /dev/null @@ -1,70 +0,0 @@ -import numpy as np -import itertools -import collections -import scipy.ndimage as ndi -from pandas.compat import zip, range - -N = 10000 - -lat = np.random.randint(0, 360, N) -lon = np.random.randint(0, 360, N) -data = np.random.randn(N) - - -def groupby1(lat, lon, data): - indexer = np.lexsort((lon, lat)) - lat = lat.take(indexer) - lon = lon.take(indexer) - sorted_data = data.take(indexer) - - keys = 1000. 
* lat + lon - unique_keys = np.unique(keys) - bounds = keys.searchsorted(unique_keys) - - result = group_agg(sorted_data, bounds, lambda x: x.mean()) - - decoder = keys.searchsorted(unique_keys) - - return dict(zip(zip(lat.take(decoder), lon.take(decoder)), result)) - - -def group_mean(lat, lon, data): - indexer = np.lexsort((lon, lat)) - lat = lat.take(indexer) - lon = lon.take(indexer) - sorted_data = data.take(indexer) - - keys = 1000 * lat + lon - unique_keys = np.unique(keys) - - result = ndi.mean(sorted_data, labels=keys, index=unique_keys) - decoder = keys.searchsorted(unique_keys) - - return dict(zip(zip(lat.take(decoder), lon.take(decoder)), result)) - - -def group_mean_naive(lat, lon, data): - grouped = collections.defaultdict(list) - for lt, ln, da in zip(lat, lon, data): - grouped[(lt, ln)].append(da) - - averaged = dict((ltln, np.mean(da)) for ltln, da in grouped.items()) - - return averaged - - -def group_agg(values, bounds, f): - N = len(values) - result = np.empty(len(bounds), dtype=float) - for i, left_bound in enumerate(bounds): - if i == len(bounds) - 1: - right_bound = N - else: - right_bound = bounds[i + 1] - - result[i] = f(values[left_bound: right_bound]) - - return result - -# for i in range(10): -# groupby1(lat, lon, data) diff --git a/bench/zoo_bench.R b/bench/zoo_bench.R deleted file mode 100644 index 294d55f51a9ab..0000000000000 --- a/bench/zoo_bench.R +++ /dev/null @@ -1,71 +0,0 @@ -library(zoo) -library(xts) -library(fts) -library(tseries) -library(its) -library(xtable) - -## indices = rep(NA, 100000) -## for (i in 1:100000) -## indices[i] <- paste(sample(letters, 10), collapse="") - - - -## x <- zoo(rnorm(100000), indices) -## y <- zoo(rnorm(90000), indices[sample(1:100000, 90000)]) - -## indices <- as.POSIXct(1:100000) - -indices <- as.POSIXct(Sys.Date()) + seq(1, 100000000, 100) - -sz <- 500000 - -## x <- xts(rnorm(sz), sample(indices, sz)) -## y <- xts(rnorm(sz), sample(indices, sz)) - -zoo.bench <- function(){ - x <- zoo(rnorm(sz), sample(indices, sz)) - y <- zoo(rnorm(sz), sample(indices, sz)) - timeit(function() {x + y}) -} - -xts.bench <- function(){ - x <- xts(rnorm(sz), sample(indices, sz)) - y <- xts(rnorm(sz), sample(indices, sz)) - timeit(function() {x + y}) -} - -fts.bench <- function(){ - x <- fts(rnorm(sz), sort(sample(indices, sz))) - y <- fts(rnorm(sz), sort(sample(indices, sz)) - timeit(function() {x + y}) -} - -its.bench <- function(){ - x <- its(rnorm(sz), sort(sample(indices, sz))) - y <- its(rnorm(sz), sort(sample(indices, sz))) - timeit(function() {x + y}) -} - -irts.bench <- function(){ - x <- irts(sort(sample(indices, sz)), rnorm(sz)) - y <- irts(sort(sample(indices, sz)), rnorm(sz)) - timeit(function() {x + y}) -} - -timeit <- function(f){ - timings <- numeric() - for (i in 1:10) { - gc() - timings[i] = system.time(f())[3] - } - mean(timings) -} - -bench <- function(){ - results <- c(xts.bench(), fts.bench(), its.bench(), zoo.bench()) - names <- c("xts", "fts", "its", "zoo") - data.frame(results, names) -} - -result <- bench() diff --git a/bench/zoo_bench.py b/bench/zoo_bench.py deleted file mode 100644 index 74cb1952a5a2a..0000000000000 --- a/bench/zoo_bench.py +++ /dev/null @@ -1,36 +0,0 @@ -from pandas import * -from pandas.util.testing import rands - -n = 1000000 -# indices = Index([rands(10) for _ in xrange(n)]) - - -def sample(values, k): - sampler = np.random.permutation(len(values)) - return values.take(sampler[:k]) -sz = 500000 -rng = np.arange(0, 10000000000000, 10000000) -stamps = np.datetime64(datetime.now()).view('i8') + 
rng -idx1 = np.sort(sample(stamps, sz)) -idx2 = np.sort(sample(stamps, sz)) -ts1 = Series(np.random.randn(sz), idx1) -ts2 = Series(np.random.randn(sz), idx2) - - -# subsample_size = 90000 - -# x = Series(np.random.randn(100000), indices) -# y = Series(np.random.randn(subsample_size), -# index=sample(indices, subsample_size)) - - -# lx = larry(np.random.randn(100000), [list(indices)]) -# ly = larry(np.random.randn(subsample_size), [list(y.index)]) - -# Benchmark 1: Two 1-million length time series (int64-based index) with -# randomly chosen timestamps - -# Benchmark 2: Join two 5-variate time series DataFrames (outer and inner join) - -# df1 = DataFrame(np.random.randn(1000000, 5), idx1, columns=range(5)) -# df2 = DataFrame(np.random.randn(1000000, 5), idx2, columns=range(5, 10)) diff --git a/ci/after_script.sh b/ci/after_script.sh deleted file mode 100755 index b17d69daa5b8d..0000000000000 --- a/ci/after_script.sh +++ /dev/null @@ -1,26 +0,0 @@ -#!/bin/bash - -#wget https://raw.github.com/y-p/ScatterCI-CLI/master/scatter_cli.py -#chmod u+x scatter_cli.py - -pip install -I requests==2.1.0 -echo "${TRAVIS_PYTHON_VERSION:0:4}" -if [ x"${TRAVIS_PYTHON_VERSION:0:4}" == x"2.6" ]; then - pip install simplejson; -fi - -# ScatterCI accepts a build log, but currently does nothing with it. -echo '' > /tmp/build.log - -# nore exposed in the build logs -#export SCATTERCI_ACCESS_KEY= -#export SCATTERCI_HOST= - -# Generate a json file describing system and dep versions -ci/print_versions.py -j /tmp/env.json - -# nose ran using "--with-xunit --xunit-file nosetest.xml" and generated /tmp/nosetest.xml -# Will timeout if server not available, and should not fail the build -#python scatter_cli.py --xunit-file /tmp/nosetests.xml --log-file /tmp/build.log --env-file /tmp/env.json --build-name "$JOB_NAME" --succeed - -true # never fail because bad things happened here diff --git a/ci/appveyor-27.yaml b/ci/appveyor-27.yaml new file mode 100644 index 0000000000000..10511ac0e00ca --- /dev/null +++ b/ci/appveyor-27.yaml @@ -0,0 +1,30 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - bottleneck + - dateutil + - gcsfs + - html5lib + - jinja2=2.8 + - lxml + - matplotlib + - numexpr + - numpy=1.12* + - openpyxl + - pytables + - python=2.7.* + - pytz + - s3fs + - scipy + - sqlalchemy + - xlrd + - xlsxwriter + - xlwt + # universal + - cython + - pytest + - pytest-xdist + - moto diff --git a/ci/appveyor-36.yaml b/ci/appveyor-36.yaml new file mode 100644 index 0000000000000..868724419c464 --- /dev/null +++ b/ci/appveyor-36.yaml @@ -0,0 +1,27 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - blosc + - bottleneck + - fastparquet + - feather-format + - matplotlib + - numexpr + - numpy=1.14* + - openpyxl + - pyarrow + - pytables + - python-dateutil + - python=3.6.* + - pytz + - scipy + - thrift=0.10* + - xlrd + - xlsxwriter + - xlwt + # universal + - cython + - pytest + - pytest-xdist diff --git a/ci/before_install.sh b/ci/before_install.sh deleted file mode 100755 index e4376e1bf21c2..0000000000000 --- a/ci/before_install.sh +++ /dev/null @@ -1,13 +0,0 @@ -#!/bin/bash - -# If envars.sh determined we're running in an authorized fork -# and the user opted in to the network cache,and that cached versions -# are available on the cache server, download and deploy the cached -# files to the local filesystem - -echo "inside $0" - -# overview -sudo apt-get update $APT_ARGS # run apt-get update for all versions - -true # never fail because bad things happened here 
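The ci/*.yaml files added above are conda environment files. A minimal sketch of how one can be consumed locally, assuming conda is on PATH; it mirrors the `conda env create --file=` call, the `source activate pandas` step, and the in-place build that ci/install_circle.sh and ci/install_travis.sh below perform. The ENV_FILE choice here is illustrative only:

#!/bin/bash
# Sketch only: recreate one of the CI environments locally.
ENV_FILE="ci/appveyor-36.yaml"   # hypothetical choice; CI sets this per job
conda env create -q -n pandas --file="${ENV_FILE}" || exit 1
source activate pandas
# build pandas in-place, as the CI install scripts do
python setup.py build_ext --inplace || exit 1
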
diff --git a/ci/before_script_travis.sh b/ci/before_script_travis.sh new file mode 100755 index 0000000000000..0b3939b1906a2 --- /dev/null +++ b/ci/before_script_travis.sh @@ -0,0 +1,11 @@ +#!/bin/bash + +echo "inside $0" + +if [ "${TRAVIS_OS_NAME}" == "linux" ]; then + sh -e /etc/init.d/xvfb start + sleep 3 +fi + +# Never fail because bad things happened here. +true diff --git a/ci/build_docs.sh b/ci/build_docs.sh index a8488e202dbec..90a666dc34ed7 100755 --- a/ci/build_docs.sh +++ b/ci/build_docs.sh @@ -1,42 +1,50 @@ #!/bin/bash +if [ "${TRAVIS_OS_NAME}" != "linux" ]; then + echo "not doing build_docs on non-linux" + exit 0 +fi + cd "$TRAVIS_BUILD_DIR" echo "inside $0" git show --pretty="format:" --name-only HEAD~5.. --first-parent | grep -P "rst|txt|doc" -if [ "$?" != "0" ]; then - echo "Skipping doc build, none were modified" - # nope, skip docs build - exit 0 -fi +# if [ "$?" != "0" ]; then +# echo "Skipping doc build, none were modified" +# # nope, skip docs build +# exit 0 +# fi -if [ x"$DOC_BUILD" != x"" ]; then +if [ "$DOC" ]; then - # we're running network tests, let's build the docs in the meantime echo "Will build docs" - conda install -n pandas sphinx=1.1.3 pygments ipython=2.4 --yes source activate pandas mv "$TRAVIS_BUILD_DIR"/doc /tmp + mv "$TRAVIS_BUILD_DIR/LICENSE" /tmp # included in the docs. cd /tmp/doc - rm /tmp/doc/source/api.rst # no R - rm /tmp/doc/source/r_interface.rst # no R - echo ############################### echo # Log file for the doc build # echo ############################### - echo -e "y\n" | ./make.py --no-api 2>&1 + echo ./make.py + ./make.py + + echo ######################## + echo # Create and send docs # + echo ######################## cd /tmp/doc/build/html git config --global user.email "pandas-docs-bot@localhost.foo" git config --global user.name "pandas-docs-bot" + # create the repo git init + touch README git add README git commit -m "Initial commit" --allow-empty @@ -45,8 +53,22 @@ if [ x"$DOC_BUILD" != x"" ]; then touch .nojekyll git add --all . 
git commit -m "Version" --allow-empty - git remote add origin https://$GH_TOKEN@github.com/pandas-docs/pandas-docs-travis + + git remote remove origin + git remote add origin "https://${PANDAS_GH_TOKEN}@github.com/pandas-dev/pandas-docs-travis.git" + git fetch origin + git remote -v + git push origin gh-pages -f + + echo "Running doctests" + cd "$TRAVIS_BUILD_DIR" + pytest --doctest-modules \ + pandas/core/reshape/concat.py \ + pandas/core/reshape/pivot.py \ + pandas/core/reshape/reshape.py \ + pandas/core/reshape/tile.py + fi exit 0 diff --git a/ci/check_cache.sh b/ci/check_cache.sh new file mode 100755 index 0000000000000..b83144fc45ef4 --- /dev/null +++ b/ci/check_cache.sh @@ -0,0 +1,27 @@ +#!/bin/bash + +# currently not used +# script to make sure that cache is clean +# Travis CI now handles this + +if [ "$TRAVIS_PULL_REQUEST" == "false" ] +then + echo "Not a PR: checking for changes in ci/ from last 2 commits" + git diff HEAD~2 --numstat | grep -E "ci/" + ci_changes=$(git diff HEAD~2 --numstat | grep -E "ci/"| wc -l) +else + echo "PR: checking for changes in ci/ from last 2 commits" + git fetch origin pull/${TRAVIS_PULL_REQUEST}/head:PR_HEAD + git diff PR_HEAD~2 --numstat | grep -E "ci/" + ci_changes=$(git diff PR_HEAD~2 --numstat | grep -E "ci/"| wc -l) +fi + +CACHE_DIR="$HOME/.cache/" +CCACHE_DIR="$HOME/.ccache/" + +if [ $ci_changes -ne 0 ] +then + echo "Files have changed in ci/ deleting all caches" + rm -rf "$CACHE_DIR" + rm -rf "$CCACHE_DIR" +fi diff --git a/ci/check_imports.py b/ci/check_imports.py new file mode 100644 index 0000000000000..3f09290f8c375 --- /dev/null +++ b/ci/check_imports.py @@ -0,0 +1,36 @@ +""" +Check that certain modules are not loaded by `import pandas` +""" +import sys + +blacklist = { + 'bs4', + 'gcsfs', + 'html5lib', + 'ipython', + 'jinja2' + 'lxml', + 'numexpr', + 'openpyxl', + 'py', + 'pytest', + 's3fs', + 'scipy', + 'tables', + 'xlrd', + 'xlsxwriter', + 'xlwt', +} + + +def main(): + import pandas # noqa + + modules = set(x.split('.')[0] for x in sys.modules) + imported = modules & blacklist + if modules & blacklist: + sys.exit("Imported {}".format(imported)) + + +if __name__ == '__main__': + main() diff --git a/ci/circle-27-compat.yaml b/ci/circle-27-compat.yaml new file mode 100644 index 0000000000000..81a48d4edf11c --- /dev/null +++ b/ci/circle-27-compat.yaml @@ -0,0 +1,28 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - bottleneck=1.0.0 + - cython=0.24 + - jinja2=2.8 + - numexpr=2.4.4 # we test that we correctly don't use an unsupported numexpr + - numpy=1.9.2 + - openpyxl + - psycopg2 + - pytables=3.2.2 + - python-dateutil=2.5.0 + - python=2.7* + - pytz=2013b + - scipy=0.14.0 + - sqlalchemy=0.7.8 + - xlrd=0.9.2 + - xlsxwriter=0.5.2 + - xlwt=0.7.5 + # universal + - pytest + - pytest-xdist + - pip: + - html5lib==1.0b2 + - beautifulsoup4==4.2.1 + - pymysql==0.6.0 diff --git a/ci/circle-35-ascii.yaml b/ci/circle-35-ascii.yaml new file mode 100644 index 0000000000000..602c414b49bb2 --- /dev/null +++ b/ci/circle-35-ascii.yaml @@ -0,0 +1,13 @@ +name: pandas +channels: + - defaults +dependencies: + - cython + - nomkl + - numpy + - python-dateutil + - python=3.5* + - pytz + # universal + - pytest + - pytest-xdist diff --git a/ci/circle-36-locale.yaml b/ci/circle-36-locale.yaml new file mode 100644 index 0000000000000..cc852c1e2aeeb --- /dev/null +++ b/ci/circle-36-locale.yaml @@ -0,0 +1,33 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - cython + - html5lib + - ipython + - 
jinja2 + - lxml + - matplotlib + - nomkl + - numexpr + - numpy + - openpyxl + - psycopg2 + - pymysql + - pytables + - python-dateutil + - python=3.6* + - pytz + - s3fs + - scipy + - sqlalchemy + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest + - pytest-xdist + - moto diff --git a/ci/circle-36-locale_slow.yaml b/ci/circle-36-locale_slow.yaml new file mode 100644 index 0000000000000..f44e98e1ee09d --- /dev/null +++ b/ci/circle-36-locale_slow.yaml @@ -0,0 +1,34 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - cython + - gcsfs + - html5lib + - ipython + - jinja2 + - lxml + - matplotlib + - nomkl + - numexpr + - numpy + - openpyxl + - psycopg2 + - pymysql + - pytables + - python-dateutil + - python=3.6* + - pytz + - s3fs + - scipy + - sqlalchemy + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest + - pytest-xdist + - moto diff --git a/ci/cron/go_doc.sh b/ci/cron/go_doc.sh deleted file mode 100755 index 89659577d0e7f..0000000000000 --- a/ci/cron/go_doc.sh +++ /dev/null @@ -1,99 +0,0 @@ -#!/bin/bash - -# This is a one-command cron job for setting up -# a virtualenv-based, linux-based, py2-based environment -# for building the Pandas documentation. -# -# The first run will install all required deps from pypi -# into the venv including monsters like scipy. -# You may want to set it up yourself to speed up the -# process. -# -# This is meant to be run as a cron job under a dedicated -# user account whose HOME directory contains this script. -# a CI directory will be created under it and all files -# stored within it. -# -# The hardcoded dep versions will gradually become obsolete -# You may need to tweak them -# -# @y-p, Jan/2014 - -# disto latex is sometimes finicky. Optionall use -# a local texlive install -export PATH=/mnt/debian/texlive/2013/bin/x86_64-linux:$PATH - -# Having ccache will speed things up -export PATH=/usr/lib64/ccache/:$PATH - -# limit disk usage -ccache -M 200M - -BASEDIR="$HOME/CI" -REPO_URL="https://github.com/pydata/pandas" -REPO_LOC="$BASEDIR/pandas" - -if [ ! -d $BASEDIR ]; then - mkdir -p $BASEDIR - virtualenv $BASEDIR/venv -fi - -source $BASEDIR/venv/bin/activate - -pip install numpy==1.7.2 -pip install cython==0.20.0 -pip install python-dateutil==2.2 -pip install --pre pytz==2013.9 -pip install sphinx==1.1.3 -pip install numexpr==2.2.2 - -pip install matplotlib==1.3.0 -pip install lxml==3.2.5 -pip install beautifulsoup4==4.3.2 -pip install html5lib==0.99 - -# You'll need R as well -pip install rpy2==2.3.9 - -pip install tables==3.0.0 -pip install bottleneck==0.7.0 -pip install ipython==0.13.2 - -# only if you have too -pip install scipy==0.13.2 - -pip install openpyxl==1.6.2 -pip install xlrd==0.9.2 -pip install xlwt==0.7.5 -pip install xlsxwriter==0.5.1 -pip install sqlalchemy==0.8.3 - -if [ ! -d "$REPO_LOC" ]; then - git clone "$REPO_URL" "$REPO_LOC" -fi - -cd "$REPO_LOC" -git reset --hard -git clean -df -git checkout master -git pull origin -make - -source $BASEDIR/venv/bin/activate -export PATH="/usr/lib64/ccache/:$PATH" -pip uninstall pandas -yq -pip install "$REPO_LOC" - -cd "$REPO_LOC"/doc - -python make.py clean -python make.py html -if [ ! $? 
== 0 ]; then - exit 1 -fi -python make.py zip_html -# usually requires manual intervention -# python make.py latex - -# If you have access: -# python make.py upload_dev diff --git a/ci/environment-dev.yaml b/ci/environment-dev.yaml new file mode 100644 index 0000000000000..5733857b55dd4 --- /dev/null +++ b/ci/environment-dev.yaml @@ -0,0 +1,16 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - Cython + - NumPy + - flake8 + - moto + - pytest>=3.1 + - python-dateutil>=2.5.0 + - python=3 + - pytz + - setuptools>=24.2.0 + - sphinx + - sphinxcontrib-spelling diff --git a/ci/install.ps1 b/ci/install.ps1 new file mode 100644 index 0000000000000..64ec7f81884cd --- /dev/null +++ b/ci/install.ps1 @@ -0,0 +1,92 @@ +# Sample script to install Miniconda under Windows +# Authors: Olivier Grisel, Jonathan Helmus and Kyle Kastner, Robert McGibbon +# License: CC0 1.0 Universal: http://creativecommons.org/publicdomain/zero/1.0/ + +$MINICONDA_URL = "http://repo.continuum.io/miniconda/" + + +function DownloadMiniconda ($python_version, $platform_suffix) { + $webclient = New-Object System.Net.WebClient + $filename = "Miniconda3-latest-Windows-" + $platform_suffix + ".exe" + $url = $MINICONDA_URL + $filename + + $basedir = $pwd.Path + "\" + $filepath = $basedir + $filename + if (Test-Path $filename) { + Write-Host "Reusing" $filepath + return $filepath + } + + # Download and retry up to 3 times in case of network transient errors. + Write-Host "Downloading" $filename "from" $url + $retry_attempts = 2 + for($i=0; $i -lt $retry_attempts; $i++){ + try { + $webclient.DownloadFile($url, $filepath) + break + } + Catch [Exception]{ + Start-Sleep 1 + } + } + if (Test-Path $filepath) { + Write-Host "File saved at" $filepath + } else { + # Retry once to get the error message if any at the last try + $webclient.DownloadFile($url, $filepath) + } + return $filepath +} + + +function InstallMiniconda ($python_version, $architecture, $python_home) { + Write-Host "Installing Python" $python_version "for" $architecture "bit architecture to" $python_home + if (Test-Path $python_home) { + Write-Host $python_home "already exists, skipping." + return $false + } + if ($architecture -match "32") { + $platform_suffix = "x86" + } else { + $platform_suffix = "x86_64" + } + + $filepath = DownloadMiniconda $python_version $platform_suffix + Write-Host "Installing" $filepath "to" $python_home + $install_log = $python_home + ".log" + $args = "/S /D=$python_home" + Write-Host $filepath $args + Start-Process -FilePath $filepath -ArgumentList $args -Wait -Passthru + if (Test-Path $python_home) { + Write-Host "Python $python_version ($architecture) installation complete" + } else { + Write-Host "Failed to install Python in $python_home" + Get-Content -Path $install_log + Exit 1 + } +} + + +function InstallCondaPackages ($python_home, $spec) { + $conda_path = $python_home + "\Scripts\conda.exe" + $args = "install --yes " + $spec + Write-Host ("conda " + $args) + Start-Process -FilePath "$conda_path" -ArgumentList $args -Wait -Passthru +} + +function UpdateConda ($python_home) { + $conda_path = $python_home + "\Scripts\conda.exe" + Write-Host "Updating conda..." 
+ $args = "update --yes conda" + Write-Host $conda_path $args + Start-Process -FilePath "$conda_path" -ArgumentList $args -Wait -Passthru +} + + +function main () { + InstallMiniconda "3.5" $env:PYTHON_ARCH $env:CONDA_ROOT + UpdateConda $env:CONDA_ROOT + InstallCondaPackages $env:CONDA_ROOT "conda-build jinja2 anaconda-client" +} + +main diff --git a/ci/install_appveyor.ps1 b/ci/install_appveyor.ps1 deleted file mode 100644 index a022995dc7d58..0000000000000 --- a/ci/install_appveyor.ps1 +++ /dev/null @@ -1,133 +0,0 @@ -# Sample script to install Miniconda under Windows -# Authors: Olivier Grisel, Jonathan Helmus and Kyle Kastner, Robert McGibbon -# License: CC0 1.0 Universal: http://creativecommons.org/publicdomain/zero/1.0/ - -$MINICONDA_URL = "http://repo.continuum.io/miniconda/" - - -function DownloadMiniconda ($python_version, $platform_suffix) { - $webclient = New-Object System.Net.WebClient - if ($python_version -match "3.4") { - $filename = "Miniconda3-3.5.5-Windows-" + $platform_suffix + ".exe" - } else { - $filename = "Miniconda-3.5.5-Windows-" + $platform_suffix + ".exe" - } - $url = $MINICONDA_URL + $filename - - $basedir = $pwd.Path + "\" - $filepath = $basedir + $filename - if (Test-Path $filename) { - Write-Host "Reusing" $filepath - return $filepath - } - - # Download and retry up to 3 times in case of network transient errors. - Write-Host "Downloading" $filename "from" $url - $retry_attempts = 2 - for($i=0; $i -lt $retry_attempts; $i++){ - try { - $webclient.DownloadFile($url, $filepath) - break - } - Catch [Exception]{ - Start-Sleep 1 - } - } - if (Test-Path $filepath) { - Write-Host "File saved at" $filepath - } else { - # Retry once to get the error message if any at the last try - $webclient.DownloadFile($url, $filepath) - } - return $filepath -} - -function Start-Executable { - param( - [String] $FilePath, - [String[]] $ArgumentList - ) - $OFS = " " - $process = New-Object System.Diagnostics.Process - $process.StartInfo.FileName = $FilePath - $process.StartInfo.Arguments = $ArgumentList - $process.StartInfo.UseShellExecute = $false - $process.StartInfo.RedirectStandardOutput = $true - if ( $process.Start() ) { - $output = $process.StandardOutput.ReadToEnd() ` - -replace "\r\n$","" - if ( $output ) { - if ( $output.Contains("`r`n") ) { - $output -split "`r`n" - } - elseif ( $output.Contains("`n") ) { - $output -split "`n" - } - else { - $output - } - } - $process.WaitForExit() - & "$Env:SystemRoot\system32\cmd.exe" ` - /c exit $process.ExitCode - } - } - -function InstallMiniconda ($python_version, $architecture, $python_home) { - Write-Host "Installing Python" $python_version "for" $architecture "bit architecture to" $python_home - if (Test-Path $python_home) { - Write-Host $python_home "already exists, skipping." 
- return $false - } - if ($architecture -match "32") { - $platform_suffix = "x86" - } else { - $platform_suffix = "x86_64" - } - - $filepath = DownloadMiniconda $python_version $platform_suffix - Write-Host "Installing" $filepath "to" $python_home - $install_log = $python_home + ".log" - $args = "/S /D=$python_home" - Write-Host $filepath $args - Start-Process -FilePath $filepath -ArgumentList $args -Wait - if (Test-Path $python_home) { - Write-Host "Python $python_version ($architecture) installation complete" - } else { - Write-Host "Failed to install Python in $python_home" - Get-Content -Path $install_log - Exit 1 - } -} - - -function InstallCondaPackages ($python_home, $spec) { - $conda_path = $python_home + "\Scripts\conda.exe" - $args = "install --yes --quiet " + $spec - Write-Host ("conda " + $args) - Start-Executable -FilePath "$conda_path" -ArgumentList $args -} -function InstallCondaPackagesFromFile ($python_home, $ver, $arch) { - $conda_path = $python_home + "\Scripts\conda.exe" - $args = "install --yes --quiet --file " + $env:APPVEYOR_BUILD_FOLDER + "\ci\requirements-" + $ver + "_" + $arch + ".txt" - Write-Host ("conda " + $args) - Start-Executable -FilePath "$conda_path" -ArgumentList $args -} - -function UpdateConda ($python_home) { - $conda_path = $python_home + "\Scripts\conda.exe" - Write-Host "Updating conda..." - $args = "update --yes conda" - Write-Host $conda_path $args - Start-Process -FilePath "$conda_path" -ArgumentList $args -Wait -} - - -function main () { - InstallMiniconda $env:PYTHON_VERSION $env:PYTHON_ARCH $env:PYTHON - UpdateConda $env:PYTHON - InstallCondaPackages $env:PYTHON "pip setuptools nose" - InstallCondaPackagesFromFile $env:PYTHON $env:PYTHON_VERSION $env:PYTHON_ARCH -} - -main \ No newline at end of file diff --git a/ci/install_circle.sh b/ci/install_circle.sh new file mode 100755 index 0000000000000..5ffff84c88488 --- /dev/null +++ b/ci/install_circle.sh @@ -0,0 +1,80 @@ +#!/usr/bin/env bash + +home_dir=$(pwd) +echo "[home_dir: $home_dir]" + +echo "[ls -ltr]" +ls -ltr + +echo "[Using clean Miniconda install]" +rm -rf "$MINICONDA_DIR" + +# install miniconda +wget http://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh -q -O miniconda.sh || exit 1 +bash miniconda.sh -b -p "$MINICONDA_DIR" || exit 1 + +export PATH="$MINICONDA_DIR/bin:$PATH" + +echo "[update conda]" +conda config --set ssl_verify false || exit 1 +conda config --set always_yes true --set changeps1 false || exit 1 +conda update -q conda + +# add the pandas channel to take priority +# to add extra packages +echo "[add channels]" +conda config --add channels pandas || exit 1 +conda config --remove channels defaults || exit 1 +conda config --add channels defaults || exit 1 + +# Useful for debugging any issues with conda +conda info -a || exit 1 + +# support env variables passed +export ENVS_FILE=".envs" + +# make sure that the .envs file exists. 
it is ok if it is empty +touch $ENVS_FILE + +# assume all command line arguments are environmental variables +for var in "$@" +do + echo "export $var" >> $ENVS_FILE +done + +echo "[environmental variable file]" +cat $ENVS_FILE +source $ENVS_FILE + +# edit the locale override if needed +if [ -n "$LOCALE_OVERRIDE" ]; then + echo "[Adding locale to the first line of pandas/__init__.py]" + rm -f pandas/__init__.pyc + sedc="3iimport locale\nlocale.setlocale(locale.LC_ALL, '$LOCALE_OVERRIDE')\n" + sed -i "$sedc" pandas/__init__.py + echo "[head -4 pandas/__init__.py]" + head -4 pandas/__init__.py + echo +fi + +# create envbuild deps +echo "[create env]" +time conda env create -q -n pandas --file="${ENV_FILE}" || exit 1 + +source activate pandas + +# remove any installed pandas package +# w/o removing anything else +echo +echo "[removing installed pandas]" +conda remove pandas -y --force +pip uninstall -y pandas + +# build but don't install +echo "[build em]" +time python setup.py build_ext --inplace || exit 1 + +echo +echo "[show environment]" + +conda list diff --git a/ci/install_conda.sh b/ci/install_conda.sh deleted file mode 100755 index 8d99034a86109..0000000000000 --- a/ci/install_conda.sh +++ /dev/null @@ -1,129 +0,0 @@ -#!/bin/bash - -# There are 2 distinct pieces that get zipped and cached -# - The venv site-packages dir including the installed dependencies -# - The pandas build artifacts, using the build cache support via -# scripts/use_build_cache.py -# -# if the user opted in to use the cache and we're on a whitelisted fork -# - if the server doesn't hold a cached version of venv/pandas build, -# do things the slow way, and put the results on the cache server -# for the next time. -# - if the cache files are available, instal some necessaries via apt -# (no compiling needed), then directly goto script and collect 200$. -# - -function edit_init() -{ - if [ -n "$LOCALE_OVERRIDE" ]; then - echo "Adding locale to the first line of pandas/__init__.py" - rm -f pandas/__init__.pyc - sedc="3iimport locale\nlocale.setlocale(locale.LC_ALL, '$LOCALE_OVERRIDE')\n" - sed -i "$sedc" pandas/__init__.py - echo "head -4 pandas/__init__.py" - head -4 pandas/__init__.py - echo - fi -} - -edit_init - -python_major_version="${TRAVIS_PYTHON_VERSION:0:1}" -[ "$python_major_version" == "2" ] && python_major_version="" - -home_dir=$(pwd) -echo "home_dir: [$home_dir]" - -if [ -n "$LOCALE_OVERRIDE" ]; then - # make sure the locale is available - # probably useless, since you would need to relogin - time sudo locale-gen "$LOCALE_OVERRIDE" -fi - -# Need to enable for locale testing. The location of the locale file(s) is -# distro specific. 
For example, on Arch Linux all of the locales are in a -# commented file--/etc/locale.gen--that must be commented in to be used -# whereas Ubuntu looks in /var/lib/locales/supported.d/* and generates locales -# based on what's in the files in that folder -time echo 'it_CH.UTF-8 UTF-8' | sudo tee -a /var/lib/locales/supported.d/it -time sudo locale-gen - - -# install gui for clipboard testing -if [ -n "$CLIPBOARD_GUI" ]; then - echo "Using CLIPBOARD_GUI: $CLIPBOARD_GUI" - [ -n "$python_major_version" ] && py="py" - python_cb_gui_pkg=python${python_major_version}-${py}${CLIPBOARD_GUI} - time sudo apt-get $APT_ARGS install $python_cb_gui_pkg -fi - - -# install a clipboard if $CLIPBOARD is not empty -if [ -n "$CLIPBOARD" ]; then - echo "Using clipboard: $CLIPBOARD" - time sudo apt-get $APT_ARGS install $CLIPBOARD -fi - -python_major_version="${TRAVIS_PYTHON_VERSION:0:1}" -[ "$python_major_version" == "2" ] && python_major_version="" - -wget http://repo.continuum.io/miniconda/Miniconda-latest-Linux-x86_64.sh -O miniconda.sh || exit 1 -bash miniconda.sh -b -p $HOME/miniconda || exit 1 - -conda config --set always_yes yes --set changeps1 no || exit 1 -conda update -q conda || exit 1 -conda config --add channels conda-forge || exit 1 -conda config --add channels http://conda.binstar.org/pandas || exit 1 -conda config --set ssl_verify false || exit 1 - -# Useful for debugging any issues with conda -conda info -a || exit 1 - -# build deps -REQ="ci/requirements-${TRAVIS_PYTHON_VERSION}${JOB_TAG}.build" -time conda create -n pandas python=$TRAVIS_PYTHON_VERSION nose || exit 1 -time conda install -n pandas --file=${REQ} || exit 1 - -source activate pandas - -# set the compiler cache to work -if [ "$IRON_TOKEN" ]; then - export PATH=/usr/lib/ccache:/usr/lib64/ccache:$PATH - gcc=$(which gcc) - echo "gcc: $gcc" - ccache=$(which ccache) - echo "ccache: $ccache" - export CC='ccache gcc' -fi - -if [ "$BUILD_TEST" ]; then - - # build testing - pip uninstall --yes cython - pip install cython==0.15.1 - ( python setup.py build_ext --inplace && python setup.py develop ) || true - -else - - # build but don't install - time python setup.py build_ext --inplace || exit 1 - - # we may have run installations - REQ="ci/requirements-${TRAVIS_PYTHON_VERSION}${JOB_TAG}.run" - time conda install -n pandas --file=${REQ} || exit 1 - - # we may have additional pip installs - REQ="ci/requirements-${TRAVIS_PYTHON_VERSION}${JOB_TAG}.pip" - if [ -e ${REQ} ]; then - pip install -r $REQ - fi - - # remove any installed pandas package - conda remove pandas - - # install our pandas - python setup.py develop || exit 1 - -fi - -true diff --git a/ci/install_db_circle.sh b/ci/install_db_circle.sh new file mode 100755 index 0000000000000..a00f74f009f54 --- /dev/null +++ b/ci/install_db_circle.sh @@ -0,0 +1,8 @@ +#!/bin/bash + +echo "installing dbs" +mysql -e 'create database pandas_nosetest;' +psql -c 'create database pandas_nosetest;' -U postgres + +echo "done" +exit 0 diff --git a/ci/install_db_travis.sh b/ci/install_db_travis.sh new file mode 100755 index 0000000000000..e4e6d7a5a9b85 --- /dev/null +++ b/ci/install_db_travis.sh @@ -0,0 +1,13 @@ +#!/bin/bash + +if [ "${TRAVIS_OS_NAME}" != "linux" ]; then + echo "not using dbs on non-linux" + exit 0 +fi + +echo "installing dbs" +mysql -e 'create database pandas_nosetest;' +psql -c 'create database pandas_nosetest;' -U postgres + +echo "done" +exit 0 diff --git a/ci/install_pydata.sh b/ci/install_pydata.sh deleted file mode 100755 index 667b57897be7e..0000000000000 --- a/ci/install_pydata.sh 
+++ /dev/null @@ -1,159 +0,0 @@ -#!/bin/bash - -# There are 2 distinct pieces that get zipped and cached -# - The venv site-packages dir including the installed dependencies -# - The pandas build artifacts, using the build cache support via -# scripts/use_build_cache.py -# -# if the user opted in to use the cache and we're on a whitelisted fork -# - if the server doesn't hold a cached version of venv/pandas build, -# do things the slow way, and put the results on the cache server -# for the next time. -# - if the cache files are available, instal some necessaries via apt -# (no compiling needed), then directly goto script and collect 200$. -# - -function edit_init() -{ - if [ -n "$LOCALE_OVERRIDE" ]; then - echo "Adding locale to the first line of pandas/__init__.py" - rm -f pandas/__init__.pyc - sedc="3iimport locale\nlocale.setlocale(locale.LC_ALL, '$LOCALE_OVERRIDE')\n" - sed -i "$sedc" pandas/__init__.py - echo "head -4 pandas/__init__.py" - head -4 pandas/__init__.py - echo - fi -} - -edit_init - -python_major_version="${TRAVIS_PYTHON_VERSION:0:1}" -[ "$python_major_version" == "2" ] && python_major_version="" - -home_dir=$(pwd) -echo "home_dir: [$home_dir]" - -# known working -# pip==1.5.1 -# setuptools==2.2 -# wheel==0.22 -# nose==1.3.3 - -pip install -I -U pip -pip install -I -U setuptools -pip install wheel==0.22 -#pip install nose==1.3.3 -pip install nose==1.3.4 - -# comment this line to disable the fetching of wheel files -base_url=http://pandas.pydata.org/pandas-build/dev/wheels - -wheel_box=${TRAVIS_PYTHON_VERSION}${JOB_TAG} -PIP_ARGS+=" -I --use-wheel --find-links=$base_url/$wheel_box/ --allow-external --allow-insecure" - -if [ -n "$LOCALE_OVERRIDE" ]; then - # make sure the locale is available - # probably useless, since you would need to relogin - time sudo locale-gen "$LOCALE_OVERRIDE" -fi - -# we need these for numpy -time sudo apt-get $APT_ARGS install libatlas-base-dev gfortran - -if [ -n "$NUMPY_BUILD" ]; then - # building numpy - - cd $home_dir - echo "cloning numpy" - - rm -Rf /tmp/numpy - cd /tmp - - # remove the system installed numpy - pip uninstall numpy -y - - # install cython - pip install --find-links http://wheels.astropy.org/ --find-links http://wheels2.astropy.org/ --use-wheel Cython - - # clone & install - git clone --branch $NUMPY_BUILD https://github.com/numpy/numpy.git numpy - cd numpy - time pip install . - pip uninstall cython -y - - cd $home_dir - numpy_version=$(python -c 'import numpy; print(numpy.__version__)') - echo "[$home_dir] numpy current: $numpy_version" -fi - -# Force virtualenv to accept system_site_packages -rm -f $VIRTUAL_ENV/lib/python$TRAVIS_PYTHON_VERSION/no-global-site-packages.txt - -# build deps -time pip install $PIP_ARGS -r ci/requirements-${wheel_box}.build - -# Need to enable for locale testing. The location of the locale file(s) is -# distro specific. 
For example, on Arch Linux all of the locales are in a -# commented file--/etc/locale.gen--that must be commented in to be used -# whereas Ubuntu looks in /var/lib/locales/supported.d/* and generates locales -# based on what's in the files in that folder -time echo 'it_CH.UTF-8 UTF-8' | sudo tee -a /var/lib/locales/supported.d/it -time sudo locale-gen - - -# install gui for clipboard testing -if [ -n "$CLIPBOARD_GUI" ]; then - echo "Using CLIPBOARD_GUI: $CLIPBOARD_GUI" - [ -n "$python_major_version" ] && py="py" - python_cb_gui_pkg=python${python_major_version}-${py}${CLIPBOARD_GUI} - time sudo apt-get $APT_ARGS install $python_cb_gui_pkg -fi - - -# install a clipboard if $CLIPBOARD is not empty -if [ -n "$CLIPBOARD" ]; then - echo "Using clipboard: $CLIPBOARD" - time sudo apt-get $APT_ARGS install $CLIPBOARD -fi - - -# Optional Deps -if [ -n "$FULL_DEPS" ]; then - echo "Installing FULL_DEPS" - - # need libhdf5 for PyTables - time sudo apt-get $APT_ARGS install libhdf5-serial-dev -fi - - -# set the compiler cache to work -if [ "$IRON_TOKEN" ]; then - export PATH=/usr/lib/ccache:/usr/lib64/ccache:$PATH - gcc=$(which gcc) - echo "gcc: $gcc" - ccache=$(which ccache) - echo "ccache: $ccache" - export CC='ccache gcc' -fi - -# build pandas -if [ "$BUILD_TEST" ]; then - pip uninstall --yes cython - pip install cython==0.15.1 - ( python setup.py build_ext --inplace ) || true - ( python setup.py develop ) || true -else - python setup.py build_ext --inplace - python setup.py develop -fi - -# install the run libs -time pip install $PIP_ARGS -r ci/requirements-${wheel_box}.run - -# restore cython (if not numpy building) -if [ -z "$NUMPY_BUILD" ]; then - time pip install $PIP_ARGS $(cat ci/requirements-${wheel_box}.txt | grep -i cython) -fi - -true diff --git a/ci/install_test.sh b/ci/install_test.sh deleted file mode 100755 index e01ad7b94a349..0000000000000 --- a/ci/install_test.sh +++ /dev/null @@ -1,17 +0,0 @@ -#!/bin/bash - -echo "inside $0" - -if [ "$INSTALL_TEST" ]; then - source activate pandas - echo "Starting installation test." - conda uninstall cython || exit 1 - python "$TRAVIS_BUILD_DIR"/setup.py sdist --formats=zip,gztar || exit 1 - pip install "$TRAVIS_BUILD_DIR"/dist/*tar.gz || exit 1 - nosetests --exe -A "$NOSE_ARGS" pandas/tests/test_series.py --with-xunit --xunit-file=/tmp/nosetests_install.xml -else - echo "Skipping installation test." -fi -RET="$?" 
- -exit "$RET" diff --git a/ci/install_travis.sh b/ci/install_travis.sh new file mode 100755 index 0000000000000..fd4a36f86db6c --- /dev/null +++ b/ci/install_travis.sh @@ -0,0 +1,109 @@ +#!/bin/bash + +# edit the locale file if needed +function edit_init() +{ + if [ -n "$LOCALE_OVERRIDE" ]; then + echo "[Adding locale to the first line of pandas/__init__.py]" + rm -f pandas/__init__.pyc + sedc="3iimport locale\nlocale.setlocale(locale.LC_ALL, '$LOCALE_OVERRIDE')\n" + sed -i "$sedc" pandas/__init__.py + echo "[head -4 pandas/__init__.py]" + head -4 pandas/__init__.py + echo + fi +} + +echo +echo "[install_travis]" +edit_init + +home_dir=$(pwd) +echo +echo "[home_dir]: $home_dir" + +# install miniconda +MINICONDA_DIR="$HOME/miniconda3" + +echo +echo "[Using clean Miniconda install]" + +if [ -d "$MINICONDA_DIR" ]; then + rm -rf "$MINICONDA_DIR" +fi + +# install miniconda +if [ "${TRAVIS_OS_NAME}" == "osx" ]; then + time wget http://repo.continuum.io/miniconda/Miniconda3-latest-MacOSX-x86_64.sh -q -O miniconda.sh || exit 1 +else + time wget http://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh -q -O miniconda.sh || exit 1 +fi +time bash miniconda.sh -b -p "$MINICONDA_DIR" || exit 1 + +echo +echo "[show conda]" +which conda + +echo +echo "[update conda]" +conda config --set ssl_verify false || exit 1 +conda config --set quiet true --set always_yes true --set changeps1 false || exit 1 +conda update -q conda + +# Useful for debugging any issues with conda +conda info -a || exit 1 + +# set the compiler cache to work +echo +if [ -z "$NOCACHE" ] && [ "${TRAVIS_OS_NAME}" == "linux" ]; then + echo "[Using ccache]" + export PATH=/usr/lib/ccache:/usr/lib64/ccache:$PATH + gcc=$(which gcc) + echo "[gcc]: $gcc" + ccache=$(which ccache) + echo "[ccache]: $ccache" + export CC='ccache gcc' +elif [ -z "$NOCACHE" ] && [ "${TRAVIS_OS_NAME}" == "osx" ]; then + echo "[Install ccache]" + brew install ccache > /dev/null 2>&1 + echo "[Using ccache]" + export PATH=/usr/local/opt/ccache/libexec:$PATH + gcc=$(which gcc) + echo "[gcc]: $gcc" + ccache=$(which ccache) + echo "[ccache]: $ccache" +else + echo "[Not using ccache]" +fi + +echo +echo "[create env]" + +# create our environment +time conda env create -q -n pandas --file="${ENV_FILE}" || exit 1 + +source activate pandas + +# remove any installed pandas package +# w/o removing anything else +echo +echo "[removing installed pandas]" +conda remove pandas -y --force +pip uninstall -y pandas + +echo +echo "[no installed pandas]" +conda list pandas +pip list --format columns |grep pandas + +# build and install +echo "[running setup.py develop]" +python setup.py develop || exit 1 + +echo +echo "[show environment]" +conda list + +echo +echo "[done]" +exit 0 diff --git a/ci/ironcache/get.py b/ci/ironcache/get.py deleted file mode 100644 index a4663472b955c..0000000000000 --- a/ci/ironcache/get.py +++ /dev/null @@ -1,41 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- - -import sys -import re -import os -import time -import json -import base64 -from hashlib import sha1 -from iron_cache import * -import traceback as tb - -key='KEY.%s.%s' %(os.environ.get('TRAVIS_REPO_SLUG','unk'), - os.environ.get('JOB_NAME','unk')) -print(key) - -if sys.version_info[0] > 2: - key = bytes(key,encoding='utf8') - -key = sha1(key).hexdigest()[:8]+'.' 
- -b = b'' -cache = IronCache() -for i in range(20): - print("getting %s" % key+str(i)) - try: - item = cache.get(cache="travis", key=key+str(i)) - v = item.value - if sys.version_info[0] > 2: - v = bytes(v,encoding='utf8') - b += bytes(base64.b64decode(v)) - except Exception as e: - try: - print(tb.format_exc(e)) - except: - print("exception during exception, oh my") - break - -with open(os.path.join(os.environ.get('HOME',''),"ccache.7z"),'wb') as f: - f.write(b) diff --git a/ci/ironcache/put.py b/ci/ironcache/put.py deleted file mode 100644 index f6aef3a327e87..0000000000000 --- a/ci/ironcache/put.py +++ /dev/null @@ -1,48 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- - -import sys -import re -import os -import time -import json -import base64 -from hashlib import sha1 -from iron_cache import * - -key='KEY.%s.%s' %(os.environ.get('TRAVIS_REPO_SLUG','unk'), - os.environ.get('JOB_NAME','unk')) - -key='KEY.%s.%s' %(os.environ.get('TRAVIS_REPO_SLUG','unk'), - os.environ.get('JOB_NAME','unk')) -print(key) - -if sys.version_info[0] > 2: - key = bytes(key,encoding='utf8') - -key = sha1(key).hexdigest()[:8]+'.' - -os.chdir(os.environ.get('HOME')) - -cache = IronCache() - -i=0 - -for i, fname in enumerate(sorted([x for x in os.listdir('.') if re.match("ccache.\d+$",x)])): - print("Putting %s" % key+str(i)) - with open(fname,"rb") as f: - s= f.read() - value=base64.b64encode(s) - if isinstance(value, bytes): - value = value.decode('ascii') - item = cache.put(cache="travis", key=key+str(i), value=value,options=dict(expires_in=24*60*60)) - -# print("foo") -for i in range(i+1,20): - - try: - item = cache.delete(key+str(i),cache='travis') - print("Deleted %s" % key+str(i)) - except: - break - pass diff --git a/ci/lint.sh b/ci/lint.sh new file mode 100755 index 0000000000000..9bcee55e1344c --- /dev/null +++ b/ci/lint.sh @@ -0,0 +1,189 @@ +#!/bin/bash + +echo "inside $0" + +source activate pandas + +RET=0 + +if [ "$LINT" ]; then + + # pandas/_libs/src is C code, so no need to search there. + echo "Linting *.py" + flake8 pandas --filename=*.py --exclude pandas/_libs/src + if [ $? -ne "0" ]; then + RET=1 + fi + echo "Linting *.py DONE" + + echo "Linting setup.py" + flake8 setup.py + if [ $? -ne "0" ]; then + RET=1 + fi + echo "Linting setup.py DONE" + + echo "Linting asv_bench/benchmarks/" + flake8 asv_bench/benchmarks/ --exclude=asv_bench/benchmarks/*.py --ignore=F811 + if [ $? -ne "0" ]; then + RET=1 + fi + echo "Linting asv_bench/benchmarks/*.py DONE" + + echo "Linting scripts/*.py" + flake8 scripts --filename=*.py + if [ $? -ne "0" ]; then + RET=1 + fi + echo "Linting scripts/*.py DONE" + + echo "Linting doc scripts" + flake8 doc/make.py doc/source/conf.py + if [ $? -ne "0" ]; then + RET=1 + fi + echo "Linting doc scripts DONE" + + echo "Linting *.pyx" + flake8 pandas --filename=*.pyx --select=E501,E302,E203,E111,E114,E221,E303,E128,E231,E126,E265,E305,E301,E127,E261,E271,E129,W291,E222,E241,E123,F403 + if [ $? -ne "0" ]; then + RET=1 + fi + echo "Linting *.pyx DONE" + + echo "Linting *.pxi.in" + for path in 'src' + do + echo "linting -> pandas/$path" + flake8 pandas/$path --filename=*.pxi.in --select=E501,E302,E203,E111,E114,E221,E303,E231,E126,F403 + if [ $? -ne "0" ]; then + RET=1 + fi + done + echo "Linting *.pxi.in DONE" + + echo "Linting *.pxd" + for path in '_libs' + do + echo "linting -> pandas/$path" + flake8 pandas/$path --filename=*.pxd --select=E501,E302,E203,E111,E114,E221,E303,E231,E126,F403 + if [ $? 
-ne "0" ]; then + RET=1 + fi + done + echo "Linting *.pxd DONE" + + # readability/casting: Warnings about C casting instead of C++ casting + # runtime/int: Warnings about using C number types instead of C++ ones + # build/include_subdir: Warnings about prefacing included header files with directory + + # We don't lint all C files because we don't want to lint any that are built + # from Cython files nor do we want to lint C files that we didn't modify for + # this particular codebase (e.g. src/headers, src/klib, src/msgpack). However, + # we can lint all header files since they aren't "generated" like C files are. + echo "Linting *.c and *.h" + for path in '*.h' 'period_helper.c' 'datetime' 'parser' 'ujson' + do + echo "linting -> pandas/_libs/src/$path" + cpplint --quiet --extensions=c,h --headers=h --filter=-readability/casting,-runtime/int,-build/include_subdir --recursive pandas/_libs/src/$path + if [ $? -ne "0" ]; then + RET=1 + fi + done + echo "Linting *.c and *.h DONE" + + echo "Check for invalid testing" + + # Check for the following code in testing: + # + # np.testing + # np.array_equal + grep -r -E --include '*.py' --exclude testing.py '(numpy|np)(\.testing|\.array_equal)' pandas/tests/ + + if [ $? = "0" ]; then + RET=1 + fi + + # Check for pytest.warns + grep -r -E --include '*.py' 'pytest\.warns' pandas/tests/ + + if [ $? = "0" ]; then + RET=1 + fi + + # Check for the following code in the extension array base tests + # tm.assert_frame_equal + # tm.assert_series_equal + grep -r -E --include '*.py' --exclude base.py 'tm.assert_(series|frame)_equal' pandas/tests/extension/base + + if [ $? = "0" ]; then + RET=1 + fi + + echo "Check for invalid testing DONE" + + # Check for imports from pandas.core.common instead + # of `import pandas.core.common as com` + echo "Check for non-standard imports" + grep -R --include="*.py*" -E "from pandas.core.common import " pandas + if [ $? = "0" ]; then + RET=1 + fi + echo "Check for non-standard imports DONE" + + echo "Check for use of lists instead of generators in built-in Python functions" + + # Example: Avoid `any([i for i in some_iterator])` in favor of `any(i for i in some_iterator)` + # + # Check the following functions: + # any(), all(), sum(), max(), min(), list(), dict(), set(), frozenset(), tuple(), str.join() + grep -R --include="*.py*" -E "[^_](any|all|sum|max|min|list|dict|set|frozenset|tuple|join)\(\[.* for .* in .*\]\)" pandas + + if [ $? = "0" ]; then + RET=1 + fi + echo "Check for use of lists instead of generators in built-in Python functions DONE" + + echo "Check for incorrect sphinx directives" + SPHINX_DIRECTIVES=$(echo \ + "autosummary|contents|currentmodule|deprecated|function|image|"\ + "important|include|ipython|literalinclude|math|module|note|raw|"\ + "seealso|toctree|versionadded|versionchanged|warning" | tr -d "[:space:]") + for path in './pandas' './doc/source' + do + grep -R --include="*.py" --include="*.pyx" --include="*.rst" -E "\.\. ($SPHINX_DIRECTIVES):[^:]" $path + if [ $? = "0" ]; then + RET=1 + fi + done + echo "Check for incorrect sphinx directives DONE" + + echo "Check for deprecated messages without sphinx directive" + grep -R --include="*.py" --include="*.pyx" -E "(DEPRECATED|DEPRECATE|Deprecated)(:|,|\.)" pandas + + if [ $? = "0" ]; then + RET=1 + fi + echo "Check for deprecated messages without sphinx directive DONE" + + echo "Check for old-style classes" + grep -R --include="*.py" -E "class\s\S*[^)]:" pandas scripts + + if [ $? 
= "0" ]; then + RET=1 + fi + echo "Check for old-style classes DONE" + + echo "Check for backticks incorrectly rendering because of missing spaces" + grep -R --include="*.rst" -E "[a-zA-Z0-9]\`\`?[a-zA-Z0-9]" doc/source/ + + if [ $? = "0" ]; then + RET=1 + fi + echo "Check for backticks incorrectly rendering because of missing spaces DONE" + +else + echo "NOT Linting" +fi + +exit $RET diff --git a/ci/prep_ccache.sh b/ci/prep_ccache.sh deleted file mode 100755 index 34e1f2520c422..0000000000000 --- a/ci/prep_ccache.sh +++ /dev/null @@ -1,47 +0,0 @@ -#!/bin/bash - -if [ "$IRON_TOKEN" ]; then - - home_dir=$(pwd) - - # install the compiler cache - sudo apt-get $APT_ARGS install ccache p7zip-full - # iron_cache, pending py3 fixes upstream - pip install -I --allow-external --allow-insecure git+https://github.com/iron-io/iron_cache_python.git@8a451c7d7e4d16e0c3bedffd0f280d5d9bd4fe59#egg=iron_cache - - python ci/ironcache/get.py - ccache -C - - clear_cache=0 - if [ -f ~/ccache.7z ]; then - echo "Cache retrieved" - clear_cache=1 - cd $HOME - 7za e $HOME/ccache.7z - # ls -l $HOME - cd / - tar xvf $HOME/ccache - rm -rf $HOME/ccache.7z - rm -rf $HOME/ccache - - fi - - # did the last commit change cython files? - cd $home_dir - - retval=$(git diff HEAD~3 --numstat | grep -P "pyx|pxd"|wc -l) - echo "number of cython files changed: $retval" - - if [ $clear_cache -eq 1 ] && [ $retval -eq 0 ] - then - # nope, reuse cython files - echo "Will reuse cached cython file" - touch "$TRAVIS_BUILD_DIR"/pandas/*.c - touch "$TRAVIS_BUILD_DIR"/pandas/src/*.c - touch "$TRAVIS_BUILD_DIR"/pandas/*.cpp - else - echo "Rebuilding cythonized files" - fi -fi - -exit 0 diff --git a/ci/prep_cython_cache.sh b/ci/prep_cython_cache.sh new file mode 100755 index 0000000000000..18d9388327ddc --- /dev/null +++ b/ci/prep_cython_cache.sh @@ -0,0 +1,74 @@ +#!/bin/bash + +ls "$HOME/.cache/" + +PYX_CACHE_DIR="$HOME/.cache/pyxfiles" +pyx_file_list=`find ${TRAVIS_BUILD_DIR} -name "*.pyx" -o -name "*.pxd" -o -name "*.pxi.in"` +pyx_cache_file_list=`find ${PYX_CACHE_DIR} -name "*.pyx" -o -name "*.pxd" -o -name "*.pxi.in"` + +CACHE_File="$HOME/.cache/cython_files.tar" + +# Clear the cython cache 0 = NO, 1 = YES +clear_cache=0 + +pyx_files=`echo "$pyx_file_list" | wc -l` +pyx_cache_files=`echo "$pyx_cache_file_list" | wc -l` + +if [[ pyx_files -ne pyx_cache_files ]] +then + echo "Different number of pyx files" + clear_cache=1 +fi + +home_dir=$(pwd) + +if [ -f "$CACHE_File" ] && [ -z "$NOCACHE" ] && [ -d "$PYX_CACHE_DIR" ]; then + + echo "Cache available - checking pyx diff" + + for i in ${pyx_file_list} + do + diff=`diff -u $i $PYX_CACHE_DIR${i}` + if [[ $? -eq 2 ]] + then + echo "${i##*/} can't be diffed; probably not in cache" + clear_cache=1 + fi + if [[ ! 
-z $diff ]] + then + echo "${i##*/} has changed:" + echo $diff + clear_cache=1 + fi + done + + if [ "$TRAVIS_PULL_REQUEST" == "false" ] + then + echo "Not a PR" + # Uncomment next 2 lines to turn off cython caching not in a PR + # echo "Non PR cython caching is disabled" + # clear_cache=1 + else + echo "In a PR" + # Uncomment next 2 lines to turn off cython caching in a PR + # echo "PR cython caching is disabled" + # clear_cache=1 + fi + +fi + +if [ $clear_cache -eq 0 ] && [ -z "$NOCACHE" ] +then + # No and nocache is not set + echo "Will reuse cached cython file" + cd / + tar xvmf $CACHE_File + cd $home_dir +else + echo "Rebuilding cythonized files" + echo "No cache = $NOCACHE" + echo "Clear cache (1=YES) = $clear_cache" +fi + + +exit 0 diff --git a/ci/print_skipped.py b/ci/print_skipped.py index 9fb05df64bcea..dd2180f6eeb19 100755 --- a/ci/print_skipped.py +++ b/ci/print_skipped.py @@ -30,20 +30,21 @@ def parse_results(filename): i += 1 assert i - 1 == len(skipped) assert i - 1 == len(skipped) - assert len(skipped) == int(root.attrib['skip']) + # assert len(skipped) == int(root.attrib['skip']) return '\n'.join(skipped) def main(args): print('SKIPPED TESTS:') - print(parse_results(args.filename)) + for fn in args.filename: + print(parse_results(fn)) return 0 def parse_args(): import argparse parser = argparse.ArgumentParser() - parser.add_argument('filename', help='XUnit file to parse') + parser.add_argument('filename', nargs='+', help='XUnit file to parse') return parser.parse_args() diff --git a/ci/requirements-2.6.build b/ci/requirements-2.6.build deleted file mode 100644 index 85148069a9e6a..0000000000000 --- a/ci/requirements-2.6.build +++ /dev/null @@ -1,4 +0,0 @@ -numpy=1.7.1 -cython=0.19.1 -dateutil=1.5 -pytz=2013b diff --git a/ci/requirements-2.6.pip b/ci/requirements-2.6.pip deleted file mode 100644 index db293045f69ec..0000000000000 --- a/ci/requirements-2.6.pip +++ /dev/null @@ -1,3 +0,0 @@ -blosc -openpyxl -argparse diff --git a/ci/requirements-2.6.run b/ci/requirements-2.6.run deleted file mode 100644 index 5f8a2fde1409f..0000000000000 --- a/ci/requirements-2.6.run +++ /dev/null @@ -1,16 +0,0 @@ -numpy=1.7.1 -dateutil=1.5 -pytz=2013b -scipy=0.11.0 -xlwt=0.7.5 -xlrd=0.9.2 -statsmodels=0.4.3 -bottleneck=0.8.0 -numexpr=2.2.2 -pytables=3.0.0 -html5lib=1.0b2 -beautiful-soup=4.2.0 -psycopg2=2.5.1 -pymysql=0.6.0 -sqlalchemy=0.7.8 -xlsxwriter=0.4.6 diff --git a/ci/requirements-2.7.build b/ci/requirements-2.7.build deleted file mode 100644 index 6c9965ac0305e..0000000000000 --- a/ci/requirements-2.7.build +++ /dev/null @@ -1,4 +0,0 @@ -dateutil=2.1 -pytz=2013b -numpy=1.9.3 -cython=0.19.1 diff --git a/ci/requirements-2.7.pip b/ci/requirements-2.7.pip deleted file mode 100644 index 644457d69b37f..0000000000000 --- a/ci/requirements-2.7.pip +++ /dev/null @@ -1,4 +0,0 @@ -blosc -httplib2 -google-api-python-client == 1.2 -python-gflags == 2.0 diff --git a/ci/requirements-2.7.run b/ci/requirements-2.7.run deleted file mode 100644 index 10049179912da..0000000000000 --- a/ci/requirements-2.7.run +++ /dev/null @@ -1,21 +0,0 @@ -dateutil=2.1 -pytz=2013b -numpy=1.9.3 -xlwt=0.7.5 -numexpr -pytables -matplotlib -openpyxl=1.6.2 -xlrd=0.9.2 -sqlalchemy=0.9.6 -lxml=3.2.1 -scipy -xlsxwriter=0.4.6 -boto=2.36.0 -bottleneck -psycopg2=2.5.2 -patsy -pymysql=0.6.3 -html5lib=1.0b2 -beautiful-soup=4.2.1 -statsmodels diff --git a/ci/requirements-2.7_BUILD_TEST.build b/ci/requirements-2.7_BUILD_TEST.build deleted file mode 100644 index faf1e3559f7f1..0000000000000 --- a/ci/requirements-2.7_BUILD_TEST.build +++ 
/dev/null @@ -1,4 +0,0 @@ -dateutil -pytz -numpy -cython diff --git a/ci/requirements-2.7_LOCALE.build b/ci/requirements-2.7_LOCALE.build deleted file mode 100644 index ada6686f599ca..0000000000000 --- a/ci/requirements-2.7_LOCALE.build +++ /dev/null @@ -1,4 +0,0 @@ -python-dateutil -pytz=2013b -numpy=1.7.1 -cython=0.19.1 diff --git a/ci/requirements-2.7_LOCALE.pip b/ci/requirements-2.7_LOCALE.pip deleted file mode 100644 index cf8e6b8b3d3a6..0000000000000 --- a/ci/requirements-2.7_LOCALE.pip +++ /dev/null @@ -1 +0,0 @@ -blosc diff --git a/ci/requirements-2.7_LOCALE.run b/ci/requirements-2.7_LOCALE.run deleted file mode 100644 index 9bb37ee10f8db..0000000000000 --- a/ci/requirements-2.7_LOCALE.run +++ /dev/null @@ -1,17 +0,0 @@ -python-dateutil -pytz=2013b -numpy=1.7.1 -xlwt=0.7.5 -openpyxl=1.6.2 -xlsxwriter=0.4.6 -xlrd=0.9.2 -bottleneck=0.8.0 -matplotlib=1.2.1 -patsy=0.1.0 -sqlalchemy=0.8.1 -html5lib=1.0b2 -lxml=3.2.1 -scipy=0.11.0 -beautiful-soup=4.2.1 -statsmodels=0.4.3 -bigquery=2.0.17 diff --git a/ci/requirements-2.7_NUMPY_DEV_master.build b/ci/requirements-2.7_NUMPY_DEV_master.build deleted file mode 100644 index 7d1d11daf9eeb..0000000000000 --- a/ci/requirements-2.7_NUMPY_DEV_master.build +++ /dev/null @@ -1,3 +0,0 @@ -python-dateutil -pytz -cython==0.19.1 diff --git a/ci/requirements-2.7_SLOW.build b/ci/requirements-2.7_SLOW.build deleted file mode 100644 index 664e8b418def7..0000000000000 --- a/ci/requirements-2.7_SLOW.build +++ /dev/null @@ -1,4 +0,0 @@ -python-dateutil -pytz -numpy=1.8.2 -cython diff --git a/ci/requirements-2.7_SLOW.run b/ci/requirements-2.7_SLOW.run deleted file mode 100644 index f02a7cb8a309a..0000000000000 --- a/ci/requirements-2.7_SLOW.run +++ /dev/null @@ -1,21 +0,0 @@ -python-dateutil -pytz -numpy=1.8.2 -matplotlib=1.3.1 -scipy -patsy -statsmodels -xlwt -openpyxl -xlsxwriter -xlrd -numexpr -pytables -sqlalchemy -lxml -boto -bottleneck -psycopg2 -pymysql -html5lib -beautiful-soup diff --git a/ci/requirements-3.3.build b/ci/requirements-3.3.build deleted file mode 100644 index ada6686f599ca..0000000000000 --- a/ci/requirements-3.3.build +++ /dev/null @@ -1,4 +0,0 @@ -python-dateutil -pytz=2013b -numpy=1.7.1 -cython=0.19.1 diff --git a/ci/requirements-3.3.pip b/ci/requirements-3.3.pip deleted file mode 100644 index 7e172dc039087..0000000000000 --- a/ci/requirements-3.3.pip +++ /dev/null @@ -1,2 +0,0 @@ -blosc -openpyxl diff --git a/ci/requirements-3.3.run b/ci/requirements-3.3.run deleted file mode 100644 index 0256802a69eba..0000000000000 --- a/ci/requirements-3.3.run +++ /dev/null @@ -1,16 +0,0 @@ -python-dateutil -pytz=2013b -numpy=1.7.1 -xlsxwriter=0.4.6 -xlrd=0.9.2 -xlwt -html5lib=1.0b2 -numexpr -pytables -bottleneck=0.8.0 -matplotlib -patsy -lxml=3.2.1 -scipy -beautiful-soup=4.2.1 -statsmodels diff --git a/ci/requirements-3.4.build b/ci/requirements-3.4.build deleted file mode 100644 index 6fdffd41bd4c4..0000000000000 --- a/ci/requirements-3.4.build +++ /dev/null @@ -1,4 +0,0 @@ -python-dateutil -pytz -numpy=1.8.1 -cython diff --git a/ci/requirements-3.4.pip b/ci/requirements-3.4.pip deleted file mode 100644 index 47a049aac7632..0000000000000 --- a/ci/requirements-3.4.pip +++ /dev/null @@ -1,3 +0,0 @@ -blosc -httplib2 -google-api-python-client diff --git a/ci/requirements-3.4.run b/ci/requirements-3.4.run deleted file mode 100644 index 45d082022713e..0000000000000 --- a/ci/requirements-3.4.run +++ /dev/null @@ -1,18 +0,0 @@ -python-dateutil -pytz -numpy=1.8.1 -openpyxl -xlsxwriter -xlrd -xlwt -html5lib -patsy -beautiful-soup -scipy -numexpr -pytables 
-lxml -sqlalchemy -bottleneck -pymysql=0.6.3 -psycopg2 diff --git a/ci/requirements-3.4_SLOW.build b/ci/requirements-3.4_SLOW.build deleted file mode 100644 index de36b1afb9fa4..0000000000000 --- a/ci/requirements-3.4_SLOW.build +++ /dev/null @@ -1,4 +0,0 @@ -python-dateutil -pytz -numpy=1.9.3 -cython diff --git a/ci/requirements-3.4_SLOW.run b/ci/requirements-3.4_SLOW.run deleted file mode 100644 index 1eca130ecd96a..0000000000000 --- a/ci/requirements-3.4_SLOW.run +++ /dev/null @@ -1,20 +0,0 @@ -python-dateutil -pytz -numpy=1.9.3 -openpyxl -xlsxwriter -xlrd -xlwt -html5lib -patsy -beautiful-soup -scipy -numexpr -pytables -matplotlib -lxml -sqlalchemy -bottleneck -pymysql -psycopg2 -statsmodels diff --git a/ci/requirements-3.5.build b/ci/requirements-3.5.build deleted file mode 100644 index de36b1afb9fa4..0000000000000 --- a/ci/requirements-3.5.build +++ /dev/null @@ -1,4 +0,0 @@ -python-dateutil -pytz -numpy=1.9.3 -cython diff --git a/ci/requirements-3.5.run b/ci/requirements-3.5.run deleted file mode 100644 index 91938675280d9..0000000000000 --- a/ci/requirements-3.5.run +++ /dev/null @@ -1,23 +0,0 @@ -python-dateutil -pytz -numpy=1.9.3 -openpyxl -xlsxwriter -xlrd -xlwt -patsy -scipy -numexpr -pytables -html5lib -lxml -matplotlib - -# currently causing some warnings -#sqlalchemy -#pymysql -#psycopg2 - -# not available from conda -#beautiful-soup -#bottleneck diff --git a/ci/requirements-optional-conda.txt b/ci/requirements-optional-conda.txt new file mode 100644 index 0000000000000..9e4e8e99b5205 --- /dev/null +++ b/ci/requirements-optional-conda.txt @@ -0,0 +1,28 @@ +beautifulsoup4>=4.2.1 +blosc +bottleneck +fastparquet +feather-format +gcsfs +html5lib +ipython>=5.6.0 +ipykernel +jinja2 +lxml +matplotlib +nbsphinx +numexpr +openpyxl +pyarrow +pymysql +pytables +pytest-cov +pytest-xdist +s3fs +scipy +seaborn +sqlalchemy +xarray +xlrd +xlsxwriter +xlwt diff --git a/ci/requirements-optional-pip.txt b/ci/requirements-optional-pip.txt new file mode 100644 index 0000000000000..3cce3f5339883 --- /dev/null +++ b/ci/requirements-optional-pip.txt @@ -0,0 +1,30 @@ +# This file was autogenerated by scripts/convert_deps.py +# Do not modify directly +beautifulsoup4>=4.2.1 +blosc +bottleneck +fastparquet +feather-format +gcsfs +html5lib +ipython>=5.6.0 +ipykernel +jinja2 +lxml +matplotlib +nbsphinx +numexpr +openpyxl +pyarrow +pymysql +tables +pytest-cov +pytest-xdist +s3fs +scipy +seaborn +sqlalchemy +xarray +xlrd +xlsxwriter +xlwt \ No newline at end of file diff --git a/ci/requirements_all.txt b/ci/requirements_all.txt deleted file mode 100644 index 6a0b695c5de87..0000000000000 --- a/ci/requirements_all.txt +++ /dev/null @@ -1,22 +0,0 @@ -nose -sphinx -ipython -python-dateutil -pytz -openpyxl -xlsxwriter -xlrd -xlwt -html5lib -patsy -beautiful-soup -numpy -cython -scipy -numexpr -pytables -matplotlib -lxml -sqlalchemy -bottleneck -pymysql diff --git a/ci/requirements_dev.txt b/ci/requirements_dev.txt index eac993f1cdf73..83ee30b52071d 100644 --- a/ci/requirements_dev.txt +++ b/ci/requirements_dev.txt @@ -1,5 +1,12 @@ -python-dateutil +# This file was autogenerated by scripts/convert_deps.py +# Do not modify directly +Cython +NumPy +flake8 +moto +pytest>=3.1 +python-dateutil>=2.5.0 pytz -numpy -cython -nose +setuptools>=24.2.0 +sphinx +sphinxcontrib-spelling \ No newline at end of file diff --git a/ci/run_build_docs.sh b/ci/run_build_docs.sh index c04c815297aa3..2909b9619552e 100755 --- a/ci/run_build_docs.sh +++ b/ci/run_build_docs.sh @@ -2,7 +2,7 @@ echo "inside $0" 
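 # Aside (a note on the change below, not part of the original script):
 # shell redirections apply left to right, so the removed form
 #   build_docs.sh 2>&1 > /tmp/doc.log &
 # pointed stderr at the console and only stdout at the log file, while
 #   build_docs.sh > /tmp/doc.log 2>&1
 # would have sent both to the log; the new form simply streams both
 # stdout and stderr to the CI console in the foreground.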
-"$TRAVIS_BUILD_DIR"/ci/build_docs.sh 2>&1 > /tmp/doc.log & +"$TRAVIS_BUILD_DIR"/ci/build_docs.sh 2>&1 # wait until subprocesses finish (build_docs.sh) wait diff --git a/ci/run_circle.sh b/ci/run_circle.sh new file mode 100755 index 0000000000000..435985bd42148 --- /dev/null +++ b/ci/run_circle.sh @@ -0,0 +1,9 @@ +#!/usr/bin/env bash + +echo "[running tests]" +export PATH="$MINICONDA_DIR/bin:$PATH" + +source activate pandas + +echo "pytest --strict --junitxml=$CIRCLE_TEST_REPORTS/reports/junit.xml $@ pandas" +pytest --strict --junitxml=$CIRCLE_TEST_REPORTS/reports/junit.xml $@ pandas diff --git a/ci/run_with_env.cmd b/ci/run_with_env.cmd index 3a472bc836c30..848f4608c8627 100644 --- a/ci/run_with_env.cmd +++ b/ci/run_with_env.cmd @@ -1,3 +1,7 @@ +:: EXPECTED ENV VARS: PYTHON_ARCH (either x86 or x64) +:: CONDA_PY (either 27, 33, 35 etc. - only major version is extracted) +:: +:: :: To build extensions for 64 bit Python 3, we need to configure environment :: variables to use the MSVC 2010 C++ compilers from GRMSDKX_EN_DVD.iso of: :: MS Windows SDK for Windows 7 and .NET Framework 4 (SDK v7.1) @@ -6,7 +10,8 @@ :: variables to use the MSVC 2008 C++ compilers from GRMSDKX_EN_DVD.iso of: :: MS Windows SDK for Windows 7 and .NET Framework 3.5 (SDK v7.0) :: -:: 32 bit builds do not require specific environment configurations. +:: 32 bit builds, and 64-bit builds for 3.5 and beyond, do not require specific +:: environment configurations. :: :: Note: this script needs to be run with the /E:ON and /V:ON flags for the :: cmd interpreter, at least for (SDK v7.0) @@ -15,33 +20,76 @@ :: https://github.com/cython/cython/wiki/64BitCythonExtensionsOnWindows :: http://stackoverflow.com/a/13751649/163740 :: -:: Author: Olivier Grisel +:: Author: Phil Elson +:: Original Author: Olivier Grisel (https://github.com/ogrisel/python-appveyor-demo) :: License: CC0 1.0 Universal: http://creativecommons.org/publicdomain/zero/1.0/ +:: +:: Notes about batch files for Python people: +:: +:: Quotes in values are literally part of the values: +:: SET FOO="bar" +:: FOO is now five characters long: " b a r " +:: If you don't want quotes, don't include them on the right-hand side. +:: +:: The CALL lines at the end of this file look redundant, but if you move them +:: outside of the IF clauses, they do not run properly in the SET_SDK_64==Y +:: case, I don't know why. +:: originally from https://github.com/pelson/Obvious-CI/blob/master/scripts/obvci_appveyor_python_build_env.cmd @ECHO OFF SET COMMAND_TO_RUN=%* SET WIN_SDK_ROOT=C:\Program Files\Microsoft SDKs\Windows -SET MAJOR_PYTHON_VERSION="%PYTHON_VERSION:~0,1%" -IF %MAJOR_PYTHON_VERSION% == "2" ( +:: Extract the major and minor versions, and allow for the minor version to be +:: more than 9. This requires the version number to have two dots in it. +SET MAJOR_PYTHON_VERSION=%CONDA_PY:~0,1% + +IF "%CONDA_PY:~2,1%" == "" ( + :: CONDA_PY style, such as 27, 34 etc. + SET MINOR_PYTHON_VERSION=%CONDA_PY:~1,1% +) ELSE ( + IF "%CONDA_PY:~3,1%" == "." ( + SET MINOR_PYTHON_VERSION=%CONDA_PY:~2,1% + ) ELSE ( + SET MINOR_PYTHON_VERSION=%CONDA_PY:~2,2% + ) +) + +:: Based on the Python version, determine what SDK version to use, and whether +:: to set the SDK for 64-bit. 
+IF %MAJOR_PYTHON_VERSION% == 2 ( SET WINDOWS_SDK_VERSION="v7.0" -) ELSE IF %MAJOR_PYTHON_VERSION% == "3" ( - SET WINDOWS_SDK_VERSION="v7.1" + SET SET_SDK_64=Y ) ELSE ( - ECHO Unsupported Python version: "%MAJOR_PYTHON_VERSION%" - EXIT 1 + IF %MAJOR_PYTHON_VERSION% == 3 ( + SET WINDOWS_SDK_VERSION="v7.1" + IF %MINOR_PYTHON_VERSION% LEQ 4 ( + SET SET_SDK_64=Y + ) ELSE ( + SET SET_SDK_64=N + ) + ) ELSE ( + ECHO Unsupported Python version: "%MAJOR_PYTHON_VERSION%" + EXIT /B 1 + ) ) IF "%PYTHON_ARCH%"=="64" ( - ECHO Configuring Windows SDK %WINDOWS_SDK_VERSION% for Python %MAJOR_PYTHON_VERSION% on a 64 bit architecture - SET DISTUTILS_USE_SDK=1 - SET MSSdk=1 - "%WIN_SDK_ROOT%\%WINDOWS_SDK_VERSION%\Setup\WindowsSdkVer.exe" -q -version:%WINDOWS_SDK_VERSION% - "%WIN_SDK_ROOT%\%WINDOWS_SDK_VERSION%\Bin\SetEnv.cmd" /x64 /release - ECHO Executing: %COMMAND_TO_RUN% - call %COMMAND_TO_RUN% || EXIT 1 + IF %SET_SDK_64% == Y ( + ECHO Configuring Windows SDK %WINDOWS_SDK_VERSION% for Python %MAJOR_PYTHON_VERSION% on a 64 bit architecture + SET DISTUTILS_USE_SDK=1 + SET MSSdk=1 + "%WIN_SDK_ROOT%\%WINDOWS_SDK_VERSION%\Setup\WindowsSdkVer.exe" -q -version:%WINDOWS_SDK_VERSION% + "%WIN_SDK_ROOT%\%WINDOWS_SDK_VERSION%\Bin\SetEnv.cmd" /x64 /release + ECHO Executing: %COMMAND_TO_RUN% + call %COMMAND_TO_RUN% || EXIT /B 1 + ) ELSE ( + ECHO Using default MSVC build environment for 64 bit architecture + ECHO Executing: %COMMAND_TO_RUN% + call %COMMAND_TO_RUN% || EXIT /B 1 + ) ) ELSE ( ECHO Using default MSVC build environment for 32 bit architecture ECHO Executing: %COMMAND_TO_RUN% - call %COMMAND_TO_RUN% || EXIT 1 + call %COMMAND_TO_RUN% || EXIT /B 1 ) diff --git a/ci/script.sh b/ci/script.sh deleted file mode 100755 index 1126e8249646c..0000000000000 --- a/ci/script.sh +++ /dev/null @@ -1,24 +0,0 @@ -#!/bin/bash - -echo "inside $0" - -source activate pandas - -if [ -n "$LOCALE_OVERRIDE" ]; then - export LC_ALL="$LOCALE_OVERRIDE"; - echo "Setting LC_ALL to $LOCALE_OVERRIDE" - - pycmd='import pandas; print("pandas detected console encoding: %s" % pandas.get_option("display.encoding"))' - python -c "$pycmd" -fi - -if [ "$BUILD_TEST" ]; then - echo "We are not running nosetests as this is simply a build test." -else - echo nosetests --exe -A "$NOSE_ARGS" pandas --doctest-tests --with-xunit --xunit-file=/tmp/nosetests.xml - nosetests --exe -A "$NOSE_ARGS" pandas --doctest-tests --with-xunit --xunit-file=/tmp/nosetests.xml -fi - -RET="$?" 
- -exit "$RET" diff --git a/ci/script_multi.sh b/ci/script_multi.sh new file mode 100755 index 0000000000000..2b2d4d5488b91 --- /dev/null +++ b/ci/script_multi.sh @@ -0,0 +1,46 @@ +#!/bin/bash -e + +echo "[script multi]" + +source activate pandas + +if [ -n "$LOCALE_OVERRIDE" ]; then + export LC_ALL="$LOCALE_OVERRIDE"; + echo "Setting LC_ALL to $LOCALE_OVERRIDE" + + pycmd='import pandas; print("pandas detected console encoding: %s" % pandas.get_option("display.encoding"))' + python -c "$pycmd" +fi + +# Enforce absent network during testing by faking a proxy +if echo "$TEST_ARGS" | grep -e --skip-network -q; then + export http_proxy=http://1.2.3.4 https_proxy=http://1.2.3.4; +fi + +# Workaround for pytest-xdist flaky collection order +# https://github.com/pytest-dev/pytest/issues/920 +# https://github.com/pytest-dev/pytest/issues/1075 +export PYTHONHASHSEED=$(python -c 'import random; print(random.randint(1, 4294967295))') +echo PYTHONHASHSEED=$PYTHONHASHSEED + +if [ "$DOC" ]; then + echo "We are not running pytest as this is a doc-build" + +elif [ "$COVERAGE" ]; then + echo pytest -s -n 2 -m "not single" --cov=pandas --cov-report xml:/tmp/cov-multiple.xml --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas + pytest -s -n 2 -m "not single" --cov=pandas --cov-report xml:/tmp/cov-multiple.xml --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas + +elif [ "$SLOW" ]; then + TEST_ARGS="--only-slow --skip-network" + echo pytest -r xX -m "not single and slow" -v --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas + pytest -r xX -m "not single and slow" -v --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas + +else + echo pytest -n 2 -r xX -m "not single" --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas + pytest -n 2 -r xX -m "not single" --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas # TODO: doctest + +fi + +RET="$?" + +exit "$RET" diff --git a/ci/script_single.sh b/ci/script_single.sh new file mode 100755 index 0000000000000..60e2fbb33ee5d --- /dev/null +++ b/ci/script_single.sh @@ -0,0 +1,39 @@ +#!/bin/bash + +echo "[script_single]" + +source activate pandas + +if [ -n "$LOCALE_OVERRIDE" ]; then + export LC_ALL="$LOCALE_OVERRIDE"; + echo "Setting LC_ALL to $LOCALE_OVERRIDE" + + pycmd='import pandas; print("pandas detected console encoding: %s" % pandas.get_option("display.encoding"))' + python -c "$pycmd" +fi + +if [ "$SLOW" ]; then + TEST_ARGS="--only-slow --skip-network" +fi + +# Enforce absent network during testing by faking a proxy +if echo "$TEST_ARGS" | grep -e --skip-network -q; then + export http_proxy=http://1.2.3.4 https_proxy=http://1.2.3.4; +fi + +if [ "$DOC" ]; then + echo "We are not running pytest as this is a doc-build" + +elif [ "$COVERAGE" ]; then + echo pytest -s -m "single" -r xXs --strict --cov=pandas --cov-report xml:/tmp/cov-single.xml --junitxml=/tmp/single.xml $TEST_ARGS pandas + pytest -s -m "single" -r xXs --strict --cov=pandas --cov-report xml:/tmp/cov-single.xml --junitxml=/tmp/single.xml $TEST_ARGS pandas + +else + echo pytest -m "single" -r xXs --junitxml=/tmp/single.xml --strict $TEST_ARGS pandas + pytest -m "single" -r xXs --junitxml=/tmp/single.xml --strict $TEST_ARGS pandas # TODO: doctest + +fi + +RET="$?" 
+ +exit "$RET" diff --git a/ci/show_circle.sh b/ci/show_circle.sh new file mode 100755 index 0000000000000..bfaa65c1d84f2 --- /dev/null +++ b/ci/show_circle.sh @@ -0,0 +1,8 @@ +#!/usr/bin/env bash + +echo "[installed versions]" + +export PATH="$MINICONDA_DIR/bin:$PATH" +source activate pandas + +python -c "import pandas; pandas.show_versions();" diff --git a/ci/speedpack/Vagrantfile b/ci/speedpack/Vagrantfile deleted file mode 100644 index ec939b7c0a937..0000000000000 --- a/ci/speedpack/Vagrantfile +++ /dev/null @@ -1,22 +0,0 @@ -# -*- mode: ruby -*- -# vi: set ft=ruby : -Vagrant.configure("2") do |config| - config.vm.box = "precise64" - config.vm.box_url = "http://files.vagrantup.com/precise64.box" - -# config.vbguest.auto_update = true -# config.vbguest.no_remote = true - - config.vm.synced_folder File.expand_path("..", Dir.pwd), "/reqf" - config.vm.synced_folder "wheelhouse", "/wheelhouse" - - config.vm.provider :virtualbox do |vb| - vb.customize ["modifyvm", :id, "--cpus", "4"] - vb.customize ["modifyvm", :id, "--memory", "2048"] - vb.customize ["modifyvm", :id, "--natdnshostresolver1", "on"] - vb.customize ["modifyvm", :id, "--natdnsproxy1", "on"] - end - - config.vm.provision :shell, :path => "build.sh" - -end diff --git a/ci/speedpack/build.sh b/ci/speedpack/build.sh deleted file mode 100755 index 330d8984ea7b7..0000000000000 --- a/ci/speedpack/build.sh +++ /dev/null @@ -1,117 +0,0 @@ -#!/bin/bash - -# This script is meant to run on a mint precise64 VM. -# The generated wheel files should be compatible -# with travis-ci as of 07/2013. -# -# Runtime can be up to an hour or more. - -echo "Building wheels..." - -# print a trace for everything; RTFM -set -x - -# install and update some basics -apt-get update -apt-get install python-software-properties git -y -apt-add-repository ppa:fkrull/deadsnakes -y -apt-get update - -# install some deps and virtualenv -apt-get install python-pip libfreetype6-dev libpng12-dev libhdf5-serial-dev \ - g++ libatlas-base-dev gfortran libreadline-dev zlib1g-dev flex bison \ - libxml2-dev libxslt-dev libssl-dev -y -pip install virtualenv -apt-get build-dep python-lxml -y - -# install sql servers -apt-get install postgresql-client libpq-dev -y - -export PYTHONIOENCODING='utf-8' -export VIRTUALENV_DISTRIBUTE=0 - -function create_fake_pandas() { - local site_pkg_dir="$1" - rm -rf $site_pkg_dir/pandas - mkdir $site_pkg_dir/pandas - touch $site_pkg_dir/pandas/__init__.py - echo "version = '0.10.0-phony'" > $site_pkg_dir/pandas/version.py -} - - -function get_site_pkgs_dir() { - python$1 -c 'import distutils; print(distutils.sysconfig.get_python_lib())' -} - - -function create_wheel() { - local pip_args="$1" - local wheelhouse="$2" - local n="$3" - local pyver="$4" - - local site_pkgs_dir="$(get_site_pkgs_dir $pyver)" - - - if [[ "$n" == *statsmodels* ]]; then - create_fake_pandas $site_pkgs_dir && \ - pip wheel $pip_args --wheel-dir=$wheelhouse $n && \ - pip install $pip_args --no-index $n && \ - rm -Rf $site_pkgs_dir - else - pip wheel $pip_args --wheel-dir=$wheelhouse $n - pip install $pip_args --no-index $n - fi -} - - -function generate_wheels() { - # get the requirements file - local reqfile="$1" - - # get the python version - local TAG=$(echo $reqfile | grep -Po "(\d\.?[\d\-](_\w+)?)") - - # base dir for wheel dirs - local WHEELSTREET=/wheelhouse - local WHEELHOUSE="$WHEELSTREET/$TAG" - - local PY_VER="${TAG:0:3}" - local PY_MAJOR="${PY_VER:0:1}" - local PIP_ARGS="--use-wheel --find-links=$WHEELHOUSE --download-cache /tmp" - - # install the python version 
if not installed - apt-get install python$PY_VER python$PY_VER-dev -y - - # create a new virtualenv - rm -Rf /tmp/venv - virtualenv -p python$PY_VER /tmp/venv - source /tmp/venv/bin/activate - - # install pip setuptools - pip install -I --download-cache /tmp 'git+https://github.com/pypa/pip@42102e9d#egg=pip' - pip install -I -U --download-cache /tmp setuptools - pip install -I --download-cache /tmp wheel - - # make the dir if it doesn't exist - mkdir -p $WHEELHOUSE - - # put the requirements file in the wheelhouse - cp $reqfile $WHEELHOUSE - - # install and build the wheels - cat $reqfile | while read N; do - create_wheel "$PIP_ARGS" "$WHEELHOUSE" "$N" "$PY_VER" - done -} - - -# generate a single wheel version -# generate_wheels "/reqf/requirements-2.7.txt" -# -# if vagrant is already up -# run as vagrant provision - -for reqfile in $(ls -1 /reqf/requirements-*.*); do - generate_wheels "$reqfile" -done diff --git a/ci/speedpack/nginx/nginx.conf.template b/ci/speedpack/nginx/nginx.conf.template deleted file mode 100644 index e2cfeaf053d08..0000000000000 --- a/ci/speedpack/nginx/nginx.conf.template +++ /dev/null @@ -1,48 +0,0 @@ -#user nobody; -worker_processes 1; - -#error_log logs/error.log; -#error_log logs/error.log notice; -#error_log logs/error.log info; - -#pid logs/nginx.pid; - - -events { - worker_connections 1024; -} - - -http { - include mime.types; - default_type application/octet-stream; - - #log_format main '$remote_addr - $remote_user [$time_local] "$request" ' - # '$status $body_bytes_sent "$http_referer" ' - # '"$http_user_agent" "$http_x_forwarded_for"'; - - #access_log logs/access.log on; - - sendfile on; - #tcp_nopush on; - - #keepalive_timeout 0; - keepalive_timeout 65; - - #gzip on; - - server { - listen $OPENSHIFT_IP:$OPENSHIFT_PORT; - - access_log access.log ; - sendfile on; - - location / { - root ../../app-root/data/store/; - autoindex on; - } - - - } - -} diff --git a/ci/submit_ccache.sh b/ci/submit_ccache.sh deleted file mode 100755 index da421489230dd..0000000000000 --- a/ci/submit_ccache.sh +++ /dev/null @@ -1,34 +0,0 @@ -#!/bin/bash - -home_dir=$(pwd) -ccache -s - -MISSES=$(ccache -s | grep "cache miss" | grep -Po "\d+") -echo "MISSES: $MISSES" - -if [ x"$MISSES" == x"0" ]; then - echo "No cache misses detected, skipping upload" - exit 0 -fi - -if [ "$IRON_TOKEN" ]; then - - # install the compiler cache - sudo apt-get $APT_ARGS install ccache p7zip-full - # iron_cache, pending py3 fixes upstream - pip install -I --allow-external --allow-insecure git+https://github.com/iron-io/iron_cache_python.git@8a451c7d7e4d16e0c3bedffd0f280d5d9bd4fe59#egg=iron_cache - - rm -rf $HOME/ccache.7z - - tar cf - $HOME/.ccache \ - "$TRAVIS_BUILD_DIR"/pandas/{index,algos,lib,tslib,parser,hashtable}.c \ - "$TRAVIS_BUILD_DIR"/pandas/src/{sparse,testing}.c \ - "$TRAVIS_BUILD_DIR"/pandas/msgpack.cpp \ - | 7za a -si $HOME/ccache.7z - - split -b 500000 -d $HOME/ccache.7z $HOME/ccache. 
- - python ci/ironcache/put.py -fi; - -exit 0 diff --git a/ci/submit_cython_cache.sh b/ci/submit_cython_cache.sh new file mode 100755 index 0000000000000..b87acef0ba11c --- /dev/null +++ b/ci/submit_cython_cache.sh @@ -0,0 +1,29 @@ +#!/bin/bash + +CACHE_File="$HOME/.cache/cython_files.tar" +PYX_CACHE_DIR="$HOME/.cache/pyxfiles" +pyx_file_list=`find ${TRAVIS_BUILD_DIR} -name "*.pyx" -o -name "*.pxd" -o -name "*.pxi.in"` + +rm -rf $CACHE_File +rm -rf $PYX_CACHE_DIR + +home_dir=$(pwd) + +mkdir -p $PYX_CACHE_DIR +rsync -Rv $pyx_file_list $PYX_CACHE_DIR + +echo "pyx files:" +echo $pyx_file_list + +tar cf ${CACHE_File} --files-from /dev/null + +for i in ${pyx_file_list} +do + f=${i%.pyx} + ls $f.{c,cpp} | tar rf ${CACHE_File} -T - +done + +echo "Cython files in cache tar:" +tar tvf ${CACHE_File} + +exit 0 diff --git a/ci/travis-27-locale.yaml b/ci/travis-27-locale.yaml new file mode 100644 index 0000000000000..1312c1296d46a --- /dev/null +++ b/ci/travis-27-locale.yaml @@ -0,0 +1,27 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - bottleneck=1.0.0 + - cython=0.24 + - lxml + - matplotlib=1.4.3 + - numpy=1.9.2 + - openpyxl=2.4.0 + - python-dateutil + - python-blosc + - python=2.7 + - pytz + - pytz=2013b + - scipy + - sqlalchemy=0.8.1 + - xlrd=0.9.2 + - xlsxwriter=0.5.2 + - xlwt=0.7.5 + # universal + - pytest + - pytest-xdist + - pip: + - html5lib==1.0b2 + - beautifulsoup4==4.2.1 diff --git a/ci/travis-27.yaml b/ci/travis-27.yaml new file mode 100644 index 0000000000000..482b888b88062 --- /dev/null +++ b/ci/travis-27.yaml @@ -0,0 +1,50 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - bottleneck + - cython=0.24 + - fastparquet + - feather-format + - flake8=3.4.1 + - gcsfs + - html5lib + - ipython + - jemalloc=4.5.0.post + - jinja2=2.8 + - lxml + - matplotlib + - mock + - nomkl + - numexpr + - numpy=1.13* + - openpyxl=2.4.0 + - patsy + - psycopg2 + - py + - pyarrow=0.4.1 + - PyCrypto + - pymysql=0.6.3 + - pytables + - python-blosc + - python-dateutil=2.5.0 + - python=2.7* + - pytz=2013b + - s3fs + - scipy + - sqlalchemy=0.9.6 + - xarray=0.8.0 + - xlrd=0.9.2 + - xlsxwriter=0.5.2 + - xlwt=0.7.5 + # universal + - pytest + - pytest-xdist + - moto + - pip: + - backports.lzma + - cpplint + - pandas-gbq + - pathlib diff --git a/ci/travis-35-osx.yaml b/ci/travis-35-osx.yaml new file mode 100644 index 0000000000000..e74abac4c9775 --- /dev/null +++ b/ci/travis-35-osx.yaml @@ -0,0 +1,27 @@ +name: pandas +channels: + - defaults +dependencies: + - beautifulsoup4 + - bottleneck + - cython + - html5lib + - jinja2 + - lxml + - matplotlib + - nomkl + - numexpr + - numpy=1.10.4 + - openpyxl + - pytables + - python=3.5* + - pytz + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest + - pytest-xdist + - pip: + - python-dateutil==2.5.3 diff --git a/ci/travis-36-doc.yaml b/ci/travis-36-doc.yaml new file mode 100644 index 0000000000000..c22dddbe0ba3f --- /dev/null +++ b/ci/travis-36-doc.yaml @@ -0,0 +1,45 @@ +name: pandas +channels: + - defaults + - conda-forge + - r +dependencies: + - beautifulsoup4 + - bottleneck + - cython + - fastparquet + - feather-format + - html5lib + - ipykernel + - ipython + - ipywidgets + - lxml + - matplotlib + - nbconvert + - nbformat + - nbsphinx + - notebook + - numexpr + - numpy=1.13* + - openpyxl + - pandoc + - pyqt + - pytables + - python-dateutil + - python-snappy + - python=3.6* + - pytz + - r + - rpy2 + - scipy + - seaborn + - sphinx + - sqlalchemy + - statsmodels + - xarray + - xlrd + - xlsxwriter + 
- xlwt + # universal + - pytest + - pytest-xdist diff --git a/ci/travis-36-numpydev.yaml b/ci/travis-36-numpydev.yaml new file mode 100644 index 0000000000000..455d65feb4242 --- /dev/null +++ b/ci/travis-36-numpydev.yaml @@ -0,0 +1,16 @@ +name: pandas +channels: + - defaults +dependencies: + - python=3.6* + - pytz + - Cython + # universal + - pytest + - pytest-xdist + - pip: + - "git+git://github.com/dateutil/dateutil.git" + - "-f https://7933911d6844c6c53a7d-47bd50c35cd79bd838daf386af554a83.ssl.cf2.rackcdn.com" + - "--pre" + - "numpy" + - "scipy" diff --git a/ci/travis-36-slow.yaml b/ci/travis-36-slow.yaml new file mode 100644 index 0000000000000..6c475dc48723c --- /dev/null +++ b/ci/travis-36-slow.yaml @@ -0,0 +1,30 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - cython + - html5lib + - lxml + - matplotlib + - numexpr + - numpy + - openpyxl + - patsy + - psycopg2 + - pymysql + - pytables + - python-dateutil + - python=3.6* + - pytz + - s3fs + - scipy + - sqlalchemy + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest + - pytest-xdist + - moto diff --git a/ci/travis-36.yaml b/ci/travis-36.yaml new file mode 100644 index 0000000000000..ff4f1a4a86f99 --- /dev/null +++ b/ci/travis-36.yaml @@ -0,0 +1,48 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - cython + - dask + - fastparquet + - feather-format + - gcsfs + - geopandas + - html5lib + - ipython + - jinja2 + - lxml + - matplotlib + - nomkl + - numexpr + - numpy + - openpyxl + - psycopg2 + - pyarrow + - pymysql + - pytables + - python-snappy + - python=3.6* + - pytz + - s3fs + - scikit-learn + - scipy + - seaborn + - sqlalchemy + - statsmodels + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest + - pytest-xdist + - pytest-cov + - moto + - pip: + - brotlipy + - coverage + - pandas-datareader + - python-dateutil diff --git a/ci/travis-37.yaml b/ci/travis-37.yaml new file mode 100644 index 0000000000000..8b255c9e6ec72 --- /dev/null +++ b/ci/travis-37.yaml @@ -0,0 +1,14 @@ +name: pandas +channels: + - defaults + - conda-forge + - c3i_test +dependencies: + - python=3.7 + - cython + - numpy + - python-dateutil + - nomkl + - pytz + - pytest + - pytest-xdist diff --git a/ci/travis_encrypt_gbq.sh b/ci/travis_encrypt_gbq.sh new file mode 100755 index 0000000000000..e404ca73a405e --- /dev/null +++ b/ci/travis_encrypt_gbq.sh @@ -0,0 +1,34 @@ +#!/bin/bash + +GBQ_JSON_FILE=$1 + +if [[ $# -ne 1 ]]; then + echo -e "Too few arguments.\nUsage: ./travis_encrypt_gbq.sh "\ + "" + exit 1 +fi + +if [[ $GBQ_JSON_FILE != *.json ]]; then + echo "ERROR: Expected *.json file" + exit 1 +fi + +if [[ ! -f $GBQ_JSON_FILE ]]; then + echo "ERROR: File $GBQ_JSON_FILE does not exist" + exit 1 +fi + +echo "Encrypting $GBQ_JSON_FILE..." +read -d "\n" TRAVIS_KEY TRAVIS_IV <<<$(travis encrypt-file $GBQ_JSON_FILE \ +travis_gbq.json.enc -f | grep -o "\w*_iv\|\w*_key"); + +echo "Adding your secure key to travis_gbq_config.txt ..." +echo -e "TRAVIS_IV_ENV=$TRAVIS_IV\nTRAVIS_KEY_ENV=$TRAVIS_KEY"\ +> travis_gbq_config.txt + +echo "Done. 
Removing file $GBQ_JSON_FILE" +rm $GBQ_JSON_FILE + +echo -e "Created encrypted credentials file travis_gbq.json.enc.\n"\ + "NOTE: Do NOT commit the *.json file containing your unencrypted" \ + "private key" diff --git a/ci/travis_gbq.json.enc b/ci/travis_gbq.json.enc new file mode 100644 index 0000000000000..c2a33bbd6f263 Binary files /dev/null and b/ci/travis_gbq.json.enc differ diff --git a/ci/travis_gbq_config.txt b/ci/travis_gbq_config.txt new file mode 100644 index 0000000000000..0b28cdedbd0d7 --- /dev/null +++ b/ci/travis_gbq_config.txt @@ -0,0 +1,2 @@ +TRAVIS_IV_ENV=encrypted_1d9d7b1f171b_iv +TRAVIS_KEY_ENV=encrypted_1d9d7b1f171b_key diff --git a/ci/travis_process_gbq_encryption.sh b/ci/travis_process_gbq_encryption.sh new file mode 100755 index 0000000000000..9967d40e49f0a --- /dev/null +++ b/ci/travis_process_gbq_encryption.sh @@ -0,0 +1,13 @@ +#!/bin/bash + +source ci/travis_gbq_config.txt + +if [[ -n ${SERVICE_ACCOUNT_KEY} ]]; then + echo "${SERVICE_ACCOUNT_KEY}" > ci/travis_gbq.json; +elif [[ -n ${!TRAVIS_IV_ENV} ]]; then + openssl aes-256-cbc -K ${!TRAVIS_KEY_ENV} -iv ${!TRAVIS_IV_ENV} \ + -in ci/travis_gbq.json.enc -out ci/travis_gbq.json -d; + export GBQ_PROJECT_ID='pandas-travis'; + echo 'Successfully decrypted gbq credentials' +fi + diff --git a/ci/upload_coverage.sh b/ci/upload_coverage.sh new file mode 100755 index 0000000000000..a7ef2fa908079 --- /dev/null +++ b/ci/upload_coverage.sh @@ -0,0 +1,12 @@ +#!/bin/bash + +if [ -z "$COVERAGE" ]; then + echo "coverage is not selected for this build" + exit 0 +fi + +source activate pandas + +echo "uploading coverage" +bash <(curl -s https://codecov.io/bash) -Z -c -F single -f /tmp/cov-single.xml +bash <(curl -s https://codecov.io/bash) -Z -c -F multiple -f /tmp/cov-multiple.xml diff --git a/circle.yml b/circle.yml new file mode 100644 index 0000000000000..66415defba6fe --- /dev/null +++ b/circle.yml @@ -0,0 +1,38 @@ +machine: + environment: + # these are globally set + MINICONDA_DIR: /home/ubuntu/miniconda3 + + +database: + override: + - ./ci/install_db_circle.sh + + +checkout: + post: + # since circleci does a shallow fetch + # we need to populate our tags + - git fetch --depth=1000 + + +dependencies: + override: + - > + case $CIRCLE_NODE_INDEX in + 0) + sudo apt-get install language-pack-it && ./ci/install_circle.sh JOB="2.7_COMPAT" ENV_FILE="ci/circle-27-compat.yaml" LOCALE_OVERRIDE="it_IT.UTF-8" ;; + 1) + sudo apt-get install language-pack-zh-hans && ./ci/install_circle.sh JOB="3.6_LOCALE" ENV_FILE="ci/circle-36-locale.yaml" LOCALE_OVERRIDE="zh_CN.UTF-8" ;; + 2) + sudo apt-get install language-pack-zh-hans && ./ci/install_circle.sh JOB="3.6_LOCALE_SLOW" ENV_FILE="ci/circle-36-locale_slow.yaml" LOCALE_OVERRIDE="zh_CN.UTF-8" ;; + 3) + ./ci/install_circle.sh JOB="3.5_ASCII" ENV_FILE="ci/circle-35-ascii.yaml" LOCALE_OVERRIDE="C" ;; + esac + - ./ci/show_circle.sh + + +test: + override: + - case $CIRCLE_NODE_INDEX in 0) ./ci/run_circle.sh --skip-slow --skip-network ;; 1) ./ci/run_circle.sh --only-slow --skip-network ;; 2) ./ci/run_circle.sh --skip-slow --skip-network ;; 3) ./ci/run_circle.sh --skip-slow --skip-network ;; esac: + parallel: true diff --git a/codecov.yml b/codecov.yml new file mode 100644 index 0000000000000..512bc2e82a736 --- /dev/null +++ b/codecov.yml @@ -0,0 +1,13 @@ +codecov: + branch: master + +coverage: + status: + project: + default: + enabled: no + target: '82' + patch: + default: + enabled: no + target: '50' diff --git a/conda.recipe/meta.yaml b/conda.recipe/meta.yaml index e3495bc5bd04a..86bed996c8aab 
100644
--- a/conda.recipe/meta.yaml
+++ b/conda.recipe/meta.yaml
@@ -1,9 +1,11 @@
 package:
   name: pandas
-  version: {{ environ.get('GIT_DESCRIBE_TAG', '').replace('.dev', 'dev') }}
+  version: {{ environ.get('GIT_DESCRIBE_TAG','').replace('v', '', 1) }}

 build:
   number: {{ environ.get('GIT_DESCRIBE_NUMBER', 0) }}
+  {% if GIT_DESCRIBE_NUMBER|int == 0 %}string: np{{ CONDA_NPY }}py{{ CONDA_PY }}_0
+  {% else %}string: np{{ CONDA_NPY }}py{{ CONDA_PY }}_{{ GIT_BUILD_STR }}{% endif %}

 source:
   git_url: ../
@@ -12,28 +14,21 @@ requirements:
   build:
     - python
     - cython
-    - numpy
-    - libpython  # [py2k and win]
-    - setuptools
+    - numpy 1.11.*
+    - setuptools >=3.3
+    - python-dateutil >=2.5.0
     - pytz
-    - python-dateutil

   run:
     - python
-    - numpy
-    - python-dateutil
+    - numpy >=1.11.*
+    - python-dateutil >=2.5.0
     - pytz

 test:
   imports:
     - pandas

-  #requires:
-  #  - nose
-
-  #commands:
-  #  - nosetests --exe -A "not slow and not network and not disabled" pandas
-
 about:
   home: http://pandas.pydata.org
   license: BSD
diff --git a/doc/README.rst b/doc/README.rst
index 06d95e6b9c44d..12950d323f5d3 100644
--- a/doc/README.rst
+++ b/doc/README.rst
@@ -3,9 +3,11 @@
 Contributing to the documentation
 =================================

-If you're not the developer type, contributing to the documentation is still
-of huge value. You don't even have to be an expert on
-*pandas* to do so! Something as simple as rewriting small passages for clarity
+Whether you are someone who loves writing, teaching, or development,
+contributing to the documentation is of huge value. If you don't see yourself
+as a developer type, please don't stress: we want you to
+contribute. You don't even have to be an expert on *pandas* to do so!
+Something as simple as rewriting small passages for clarity
 as you reference the docs is a simple but effective way to contribute. The
 next person to read that passage will be in your debt!
@@ -40,7 +42,7 @@ Some other important things to know about the docs:
 - The docstrings follow the **Numpy Docstring Standard** which is used widely
   in the Scientific Python community. This standard specifies the format of
   the different sections of the docstring. See `this document
-  `_
+  `_
   for a detailed explanation, or look at some of the existing functions to
   extend it in a similar manner.
@@ -81,7 +83,9 @@ have ``sphinx`` and ``ipython`` installed. `numpydoc
`_ is used to parse the docstrings that
follow the Numpy Docstring Standard (see above), but you don't need to install
this because a local copy of ``numpydoc`` is included in the pandas source
-code.
+code. `nbsphinx `_ is used to convert
+Jupyter notebooks. You will need to install it if you intend to modify any of
+the notebooks included in the documentation.

 Furthermore, it is recommended to have all `optional dependencies
 `_
@@ -155,12 +159,12 @@ Where to start?
---------------

There are a number of issues listed under `Docs
-`_
-and `Good as first PR
-`_
+`_
+and `good first issue
+`_
where you could start out.

-Or maybe you have an idea of you own, by using pandas, looking for something
+Or maybe you have an idea of your own: while using pandas and looking for
 something in the documentation, you thought 'this can be improved'. Let's do
 something about that!
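A side note on the conda.recipe/meta.yaml hunk above: the new `string:` template picks a fixed `_0` build string for tagged releases (zero commits since the tag) and appends the git build string otherwise. Below is a minimal Python sketch of how that Jinja expression renders; the variable values are made-up stand-ins for what conda-build would supply as GIT_DESCRIBE_NUMBER, CONDA_NPY, CONDA_PY and GIT_BUILD_STR:

    import jinja2

    tmpl = jinja2.Template(
        "{% if GIT_DESCRIBE_NUMBER|int == 0 %}"
        "np{{ CONDA_NPY }}py{{ CONDA_PY }}_0"
        "{% else %}"
        "np{{ CONDA_NPY }}py{{ CONDA_PY }}_{{ GIT_BUILD_STR }}"
        "{% endif %}")

    # Tagged release: zero commits since the tag -> fixed "_0" suffix.
    print(tmpl.render(GIT_DESCRIBE_NUMBER="0", CONDA_NPY="111", CONDA_PY="27"))
    # np111py27_0

    # Dev build: the git-describe build string is appended instead.
    print(tmpl.render(GIT_DESCRIBE_NUMBER="17", CONDA_NPY="111",
                      CONDA_PY="27", GIT_BUILD_STR="h1a2b3c4_17"))
    # np111py27_h1a2b3c4_17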
diff --git a/doc/_templates/api_redirect.html b/doc/_templates/api_redirect.html
index 24bdd8363830f..c04a8b58ce544 100644
--- a/doc/_templates/api_redirect.html
+++ b/doc/_templates/api_redirect.html
@@ -1,15 +1,10 @@
-{% set pgn = pagename.split('.') -%}
-{% if pgn[-2][0].isupper() -%}
-    {% set redirect = ["pandas", pgn[-2], pgn[-1], 'html']|join('.') -%}
-{% else -%}
-    {% set redirect = ["pandas", pgn[-1], 'html']|join('.') -%}
-{% endif -%}
+{% set redirect = redirects[pagename.split("/")[-1]] %}
 <html>
 <head>
 <title>This API page has moved</title>
-<meta http-equiv="refresh" content="0;URL={{ redirect }}"/>
+<meta http-equiv="refresh" content="0;URL={{ redirect }}.html"/>
 </head>
 <body>
-<p>This API page has moved <a href="{{ redirect }}">here</a>.</p>
+<p>This API page has moved <a href="{{ redirect }}.html">here</a>.</p>
 </body>
-</html>
\ No newline at end of file
+</html>
diff --git a/doc/_templates/autosummary/accessor.rst b/doc/_templates/autosummary/accessor.rst
index 1401121fb51c6..4ba745cd6fdba 100644
--- a/doc/_templates/autosummary/accessor.rst
+++ b/doc/_templates/autosummary/accessor.rst
@@ -3,4 +3,4 @@

 .. currentmodule:: {{ module.split('.')[0] }}

-.. automethod:: {{ [module.split('.')[1], objname]|join('.') }}
+.. autoaccessor:: {{ (module.split('.')[1:] + [objname]) | join('.') }}
diff --git a/doc/_templates/autosummary/accessor_attribute.rst b/doc/_templates/autosummary/accessor_attribute.rst
index e38a9f22f9d99..b5ad65d6a736f 100644
--- a/doc/_templates/autosummary/accessor_attribute.rst
+++ b/doc/_templates/autosummary/accessor_attribute.rst
@@ -3,4 +3,4 @@

 .. currentmodule:: {{ module.split('.')[0] }}

-.. autoaccessorattribute:: {{ [module.split('.')[1], objname]|join('.') }}
\ No newline at end of file
+.. autoaccessorattribute:: {{ (module.split('.')[1:] + [objname]) | join('.') }}
diff --git a/doc/_templates/autosummary/accessor_callable.rst b/doc/_templates/autosummary/accessor_callable.rst
index 6f45e0fd01e16..7a3301814f5f4 100644
--- a/doc/_templates/autosummary/accessor_callable.rst
+++ b/doc/_templates/autosummary/accessor_callable.rst
@@ -3,4 +3,4 @@

 .. currentmodule:: {{ module.split('.')[0] }}

-.. autoaccessorcallable:: {{ [module.split('.')[1], objname]|join('.') }}.__call__
+.. autoaccessorcallable:: {{ (module.split('.')[1:] + [objname]) | join('.') }}.__call__
diff --git a/doc/_templates/autosummary/accessor_method.rst b/doc/_templates/autosummary/accessor_method.rst
index 8175d8615ceb2..aefbba6ef1bbc 100644
--- a/doc/_templates/autosummary/accessor_method.rst
+++ b/doc/_templates/autosummary/accessor_method.rst
@@ -3,4 +3,4 @@

 .. currentmodule:: {{ module.split('.')[0] }}

-.. autoaccessormethod:: {{ [module.split('.')[1], objname]|join('.') }}
\ No newline at end of file
+.. autoaccessormethod:: {{ (module.split('.')[1:] + [objname]) | join('.') }}
diff --git a/doc/cheatsheet/Pandas_Cheat_Sheet.pdf b/doc/cheatsheet/Pandas_Cheat_Sheet.pdf
new file mode 100644
index 0000000000000..696ed288cf7a6
Binary files /dev/null and b/doc/cheatsheet/Pandas_Cheat_Sheet.pdf differ
diff --git a/doc/cheatsheet/Pandas_Cheat_Sheet.pptx b/doc/cheatsheet/Pandas_Cheat_Sheet.pptx
new file mode 100644
index 0000000000000..f8b98a6f1f8e4
Binary files /dev/null and b/doc/cheatsheet/Pandas_Cheat_Sheet.pptx differ
diff --git a/doc/cheatsheet/README.txt b/doc/cheatsheet/README.txt
new file mode 100644
index 0000000000000..d32fe5bcd05a6
--- /dev/null
+++ b/doc/cheatsheet/README.txt
@@ -0,0 +1,8 @@
+The Pandas Cheat Sheet was created using Microsoft PowerPoint 2013.
+To create the PDF version, within PowerPoint, simply do a "Save As"
+and pick "PDF" as the format.
+
+This cheat sheet was inspired by the RStudio Data Wrangling Cheatsheet[1], written by Irv Lustig, Princeton Consultants[2].
+
+[1]: https://www.rstudio.com/wp-content/uploads/2015/02/data-wrangling-cheatsheet.pdf
+[2]: http://www.princetonoptimization.com/
diff --git a/doc/logo/pandas_logo.png b/doc/logo/pandas_logo.png
new file mode 100644
index 0000000000000..065ee4e4856a6
Binary files /dev/null and b/doc/logo/pandas_logo.png differ
diff --git a/doc/logo/pandas_logo.py b/doc/logo/pandas_logo.py
new file mode 100644
index 0000000000000..c3647f0c7d2a8
--- /dev/null
+++ b/doc/logo/pandas_logo.py
@@ -0,0 +1,44 @@
+# script to generate the pandas logo
+
+from matplotlib import pyplot as plt
+from matplotlib import rcParams
+import numpy as np
+
+rcParams['mathtext.fontset'] = 'cm'
+
+
+def fnx():
+    return np.random.randint(5, 50, 10)
+
+
+fig = plt.figure(figsize=(6, 1.25))
+
+ax = fig.add_axes((0.45, 0.1, 0.16, 0.8))
+bar_data = [2.1, -00.8, 1.1, 2.5, -2.1, -0.5, -2.0, 1.5]
+ax.set_ylim(-3, 3)
+ax.set_xticks([])
+ax.set_yticks([])
+ax.bar(np.arange(len(bar_data)), bar_data)
+
+ax = fig.add_axes((0.63, 0.1, 0.16, 0.8))
+for i in range(4):
+    ax.plot(np.random.rand(8))
+ax.set_xticks([])
+ax.set_yticks([])
+
+ax = fig.add_axes((0.63 + 0.18, 0.1, 0.16, 0.8))
+y = np.row_stack((fnx(), fnx(), fnx()))
+x = np.arange(10)
+y1, y2, y3 = fnx(), fnx(), fnx()
+ax.stackplot(x, y1, y2, y3)
+ax.set_xticks([])
+ax.set_yticks([])
+
+plt.figtext(0.05, 0.5, "pandas", size=40)
+
+plt.figtext(
+    0.05, 0.2, r"$y_{it} = \beta^{\prime} x_{it} + \mu_{i} + \epsilon_{it}$",
+    size=16, color="#5a89a4")
+
+fig.savefig('pandas_logo.svg')
+fig.savefig('pandas_logo.png')
diff --git a/doc/logo/pandas_logo.svg b/doc/logo/pandas_logo.svg
new file mode 100644
index 0000000000000..b165f9635bf51
--- /dev/null
+++ b/doc/logo/pandas_logo.svg
@@ -0,0 +1,879 @@
+[879 lines of SVG/XML vector markup for the pandas logo; the tag contents were lost in extraction and are omitted here]
diff --git a/doc/make.py b/doc/make.py
index 6b424ce2814d5..4d54a2415a194 100755
--- a/doc/make.py
+++ b/doc/make.py
@@ -1,381 +1,372 @@
 #!/usr/bin/env python
-
 """
 Python script for building documentation.

 To build the docs you must have all optional dependencies for pandas
 installed. See the installation instructions for a list of these.

-Note: currently latex builds do not work because of table formats that are not
-supported in the latex generation.
-
-2014-01-30: Latex has some issues but 'latex_forced' works ok for 0.13.0-400 or so
-
 Usage
 -----
-python make.py clean
-python make.py html
+    $ python make.py clean
+    $ python make.py html
+    $ python make.py latex
 """
-from __future__ import print_function
-
-import glob
+import importlib
+import sys
 import os
 import shutil
-import sys
-import sphinx
+# import subprocess
 import argparse
+from contextlib import contextmanager
+import webbrowser

 import jinja2

-os.environ['PYTHONPATH'] = '..'
-
-SPHINX_BUILD = 'sphinxbuild'
-
-
-def upload_dev(user='pandas'):
-    'push a copy to the pydata dev directory'
-    if os.system('cd build/html; rsync -avz . 
{0}@pandas.pydata.org' - ':/usr/share/nginx/pandas/pandas-docs/dev/ -essh'.format(user)): - raise SystemExit('Upload to Pydata Dev failed') - - -def upload_dev_pdf(user='pandas'): - 'push a copy to the pydata dev directory' - if os.system('cd build/latex; scp pandas.pdf {0}@pandas.pydata.org' - ':/usr/share/nginx/pandas/pandas-docs/dev/'.format(user)): - raise SystemExit('PDF upload to Pydata Dev failed') - -def upload_stable(user='pandas'): - 'push a copy to the pydata stable directory' - if os.system('cd build/html; rsync -avz . {0}@pandas.pydata.org' - ':/usr/share/nginx/pandas/pandas-docs/stable/ -essh'.format(user)): - raise SystemExit('Upload to stable failed') +DOC_PATH = os.path.dirname(os.path.abspath(__file__)) +SOURCE_PATH = os.path.join(DOC_PATH, 'source') +BUILD_PATH = os.path.join(DOC_PATH, 'build') +BUILD_DIRS = ['doctrees', 'html', 'latex', 'plots', '_static', '_templates'] -def upload_stable_pdf(user='pandas'): - 'push a copy to the pydata dev directory' - if os.system('cd build/latex; scp pandas.pdf {0}@pandas.pydata.org' - ':/usr/share/nginx/pandas/pandas-docs/stable/'.format(user)): - raise SystemExit('PDF upload to stable failed') +@contextmanager +def _maybe_exclude_notebooks(): + """Skip building the notebooks if pandoc is not installed. + This assumes that nbsphinx is installed. -def upload_prev(ver, doc_root='./', user='pandas'): - 'push a copy of older release to appropriate version directory' - local_dir = doc_root + 'build/html' - remote_dir = '/usr/share/nginx/pandas/pandas-docs/version/%s/' % ver - cmd = 'cd %s; rsync -avz . %s@pandas.pydata.org:%s -essh' - cmd = cmd % (local_dir, user, remote_dir) - print(cmd) - if os.system(cmd): - raise SystemExit( - 'Upload to %s from %s failed' % (remote_dir, local_dir)) + Skip notebook conversion if: + 1. nbconvert isn't installed, or + 2. nbconvert is installed, but pandoc isn't + """ + # TODO move to exclude_pattern + base = os.path.dirname(__file__) + notebooks = [os.path.join(base, 'source', nb) + for nb in ['style.ipynb']] + contents = {} - local_dir = doc_root + 'build/latex' - pdf_cmd = 'cd %s; scp pandas.pdf %s@pandas.pydata.org:%s' - pdf_cmd = pdf_cmd % (local_dir, user, remote_dir) - if os.system(pdf_cmd): - raise SystemExit('Upload PDF to %s from %s failed' % (ver, doc_root)) + def _remove_notebooks(): + for nb in notebooks: + with open(nb, 'rt') as f: + contents[nb] = f.read() + os.remove(nb) -def build_pandas(): - os.chdir('..') - os.system('python setup.py clean') - os.system('python setup.py build_ext --inplace') - os.chdir('doc') - -def build_prev(ver): - if os.system('git checkout v%s' % ver) != 1: - os.chdir('..') - os.system('python setup.py clean') - os.system('python setup.py build_ext --inplace') - os.chdir('doc') - os.system('python make.py clean') - os.system('python make.py html') - os.system('python make.py latex') - os.system('git checkout master') - - -def clean(): - if os.path.exists('build'): - shutil.rmtree('build') - - if os.path.exists('source/generated'): - shutil.rmtree('source/generated') - - -def html(): - check_build() - if os.system('sphinx-build -P -b html -d build/doctrees ' - 'source build/html'): - raise SystemExit("Building HTML failed.") try: - # remove stale file - os.system('cd build; rm -f html/pandas.zip;') - except: - pass - -def zip_html(): - try: - print("\nZipping up HTML docs...") - # just in case the wonky build box doesn't have zip - # don't fail this. 
- os.system('cd build; rm -f html/pandas.zip; zip html/pandas.zip -r -q html/* ') - print("\n") - except: - pass - -def latex(): - check_build() - if sys.platform != 'win32': - # LaTeX format. - if os.system('sphinx-build -b latex -d build/doctrees ' - 'source build/latex'): - raise SystemExit("Building LaTeX failed.") - # Produce pdf. - - os.chdir('build/latex') - - # Call the makefile produced by sphinx... - if os.system('make'): - print("Rendering LaTeX failed.") - print("You may still be able to get a usable PDF file by going into 'build/latex'") - print("and executing 'pdflatex pandas.tex' for the requisite number of passes.") - print("Or using the 'latex_forced' target") - raise SystemExit - - os.chdir('../..') - else: - print('latex build has not been tested on windows') - -def latex_forced(): - check_build() - if sys.platform != 'win32': - # LaTeX format. - if os.system('sphinx-build -b latex -d build/doctrees ' - 'source build/latex'): - raise SystemExit("Building LaTeX failed.") - # Produce pdf. - - os.chdir('build/latex') - - # Manually call pdflatex, 3 passes should ensure latex fixes up - # all the required cross-references and such. - os.system('pdflatex -interaction=nonstopmode pandas.tex') - os.system('pdflatex -interaction=nonstopmode pandas.tex') - os.system('pdflatex -interaction=nonstopmode pandas.tex') - raise SystemExit("You should check the file 'build/latex/pandas.pdf' for problems.") - - os.chdir('../..') + import nbconvert + except ImportError: + sys.stderr.write('Warning: nbconvert not installed. ' + 'Skipping notebooks.\n') + _remove_notebooks() else: - print('latex build has not been tested on windows') - + try: + nbconvert.utils.pandoc.get_pandoc_version() + except nbconvert.utils.pandoc.PandocMissing: + sys.stderr.write('Warning: Pandoc is not installed. ' + 'Skipping notebooks.\n') + _remove_notebooks() + + yield + + for nb, content in contents.items(): + with open(nb, 'wt') as f: + f.write(content) + + +class DocBuilder: + """Class to wrap the different commands of this script. + + All public methods of this class can be called as parameters of the + script. + """ + def __init__(self, num_jobs=1, include_api=True, single_doc=None, + verbosity=0): + self.num_jobs = num_jobs + self.include_api = include_api + self.verbosity = verbosity + self.single_doc = None + self.single_doc_type = None + if single_doc is not None: + self._process_single_doc(single_doc) + self.exclude_patterns = self._exclude_patterns + + self._generate_index() + if self.single_doc_type == 'docstring': + self._run_os('sphinx-autogen', '-o', + 'source/generated_single', 'source/index.rst') + + @property + def _exclude_patterns(self): + """Docs source files that will be excluded from building.""" + # TODO move maybe_exclude_notebooks here + if self.single_doc is not None: + rst_files = [f for f in os.listdir(SOURCE_PATH) + if ((f.endswith('.rst') or f.endswith('.ipynb')) + and (f != 'index.rst') + and (f != '{0}.rst'.format(self.single_doc)))] + if self.single_doc_type != 'api': + rst_files += ['generated/*.rst'] + elif not self.include_api: + rst_files = ['api.rst', 'generated/*.rst'] + else: + rst_files = ['generated_single/*.rst'] + + exclude_patterns = ','.join( + '{!r}'.format(i) for i in ['**.ipynb_checkpoints'] + rst_files) + + return exclude_patterns + + def _process_single_doc(self, single_doc): + """Extract self.single_doc (base name) and self.single_doc_type from + passed single_doc kwarg. 
+ + """ + self.include_api = False + + if single_doc == 'api.rst' or single_doc == 'api': + self.single_doc_type = 'api' + self.single_doc = 'api' + elif os.path.exists(os.path.join(SOURCE_PATH, single_doc)): + self.single_doc_type = 'rst' + self.single_doc = os.path.splitext(os.path.basename(single_doc))[0] + elif os.path.exists( + os.path.join(SOURCE_PATH, '{}.rst'.format(single_doc))): + self.single_doc_type = 'rst' + self.single_doc = single_doc + elif single_doc is not None: + try: + obj = pandas # noqa: F821 + for name in single_doc.split('.'): + obj = getattr(obj, name) + except AttributeError: + raise ValueError('Single document not understood, it should ' + 'be a file in doc/source/*.rst (e.g. ' + '"contributing.rst" or a pandas function or ' + 'method (e.g. "pandas.DataFrame.head")') + else: + self.single_doc_type = 'docstring' + if single_doc.startswith('pandas.'): + self.single_doc = single_doc[len('pandas.'):] + else: + self.single_doc = single_doc + + def _copy_generated_docstring(self): + """Copy existing generated (from api.rst) docstring page because + this is more correct in certain cases (where a custom autodoc + template is used). + + """ + fname = os.path.join(SOURCE_PATH, 'generated', + 'pandas.{}.rst'.format(self.single_doc)) + temp_dir = os.path.join(SOURCE_PATH, 'generated_single') -def check_build(): - build_dirs = [ - 'build', 'build/doctrees', 'build/html', - 'build/latex', 'build/plots', 'build/_static', - 'build/_templates'] - for d in build_dirs: try: - os.mkdir(d) + os.makedirs(temp_dir) except OSError: pass + if os.path.exists(fname): + try: + # copying to make sure sphinx always thinks it is new + # and needs to be re-generated (to pick source code changes) + shutil.copy(fname, temp_dir) + except: # noqa + pass + + def _generate_index(self): + """Create index.rst file with the specified sections.""" + if self.single_doc_type == 'docstring': + self._copy_generated_docstring() + + with open(os.path.join(SOURCE_PATH, 'index.rst.template')) as f: + t = jinja2.Template(f.read()) + + with open(os.path.join(SOURCE_PATH, 'index.rst'), 'w') as f: + f.write(t.render(include_api=self.include_api, + single_doc=self.single_doc, + single_doc_type=self.single_doc_type)) + + @staticmethod + def _create_build_structure(): + """Create directories required to build documentation.""" + for dirname in BUILD_DIRS: + try: + os.makedirs(os.path.join(BUILD_PATH, dirname)) + except OSError: + pass + + @staticmethod + def _run_os(*args): + """Execute a command as a OS terminal. + + Parameters + ---------- + *args : list of str + Command and parameters to be executed + + Examples + -------- + >>> DocBuilder()._run_os('python', '--version') + """ + # TODO check_call should be more safe, but it fails with + # exclude patterns, needs investigation + # subprocess.check_call(args, stderr=subprocess.STDOUT) + os.system(' '.join(args)) + + def _sphinx_build(self, kind): + """Call sphinx to build documentation. + + Attribute `num_jobs` from the class is used. 
+ + Parameters + ---------- + kind : {'html', 'latex'} + + Examples + -------- + >>> DocBuilder(num_jobs=4)._sphinx_build('html') + """ + if kind not in ('html', 'latex', 'spelling'): + raise ValueError('kind must be html, latex or ' + 'spelling, not {}'.format(kind)) + + self._run_os('sphinx-build', + '-j{}'.format(self.num_jobs), + '-b{}'.format(kind), + '-{}'.format( + 'v' * self.verbosity) if self.verbosity else '', + '-d{}'.format(os.path.join(BUILD_PATH, 'doctrees')), + '-Dexclude_patterns={}'.format(self.exclude_patterns), + SOURCE_PATH, + os.path.join(BUILD_PATH, kind)) + + def _open_browser(self): + base_url = os.path.join('file://', DOC_PATH, 'build', 'html') + if self.single_doc_type == 'docstring': + url = os.path.join( + base_url, + 'generated_single', 'pandas.{}.html'.format(self.single_doc)) + else: + url = os.path.join(base_url, '{}.html'.format(self.single_doc)) + webbrowser.open(url, new=2) + + def html(self): + """Build HTML documentation.""" + self._create_build_structure() + with _maybe_exclude_notebooks(): + self._sphinx_build('html') + zip_fname = os.path.join(BUILD_PATH, 'html', 'pandas.zip') + if os.path.exists(zip_fname): + os.remove(zip_fname) + + if self.single_doc is not None: + self._open_browser() + shutil.rmtree(os.path.join(SOURCE_PATH, 'generated_single'), + ignore_errors=True) + + def latex(self, force=False): + """Build PDF documentation.""" + self._create_build_structure() + if sys.platform == 'win32': + sys.stderr.write('latex build has not been tested on windows\n') + else: + self._sphinx_build('latex') + os.chdir(os.path.join(BUILD_PATH, 'latex')) + if force: + for i in range(3): + self._run_os('pdflatex', + '-interaction=nonstopmode', + 'pandas.tex') + raise SystemExit('You should check the file ' + '"build/latex/pandas.pdf" for problems.') + else: + self._run_os('make') + + def latex_forced(self): + """Build PDF documentation with retries to find missing references.""" + self.latex(force=True) + + @staticmethod + def clean(): + """Clean documentation generated files.""" + shutil.rmtree(BUILD_PATH, ignore_errors=True) + shutil.rmtree(os.path.join(SOURCE_PATH, 'generated'), + ignore_errors=True) + + def zip_html(self): + """Compress HTML documentation into a zip file.""" + zip_fname = os.path.join(BUILD_PATH, 'html', 'pandas.zip') + if os.path.exists(zip_fname): + os.remove(zip_fname) + dirname = os.path.join(BUILD_PATH, 'html') + fnames = os.listdir(dirname) + os.chdir(dirname) + self._run_os('zip', + zip_fname, + '-r', + '-q', + *fnames) + + def spellcheck(self): + """Spell check the documentation.""" + self._sphinx_build('spelling') + output_location = os.path.join('build', 'spelling', 'output.txt') + with open(output_location) as output: + lines = output.readlines() + if lines: + raise SyntaxError( + 'Found misspelled words.' 
+ ' Check pandas/doc/build/spelling/output.txt' + ' for more details.') -def all(): - # clean() - html() - - -def auto_dev_build(debug=False): - msg = '' - try: - step = 'clean' - clean() - step = 'html' - html() - step = 'upload dev' - upload_dev() - if not debug: - sendmail(step) - - step = 'latex' - latex() - step = 'upload pdf' - upload_dev_pdf() - if not debug: - sendmail(step) - except (Exception, SystemExit) as inst: - msg = str(inst) + '\n' - sendmail(step, '[ERROR] ' + msg) - - -def sendmail(step=None, err_msg=None): - from_name, to_name = _get_config() - - if step is None: - step = '' - - if err_msg is None or '[ERROR]' not in err_msg: - msgstr = 'Daily docs %s completed successfully' % step - subject = "DOC: %s successful" % step - else: - msgstr = err_msg - subject = "DOC: %s failed" % step - - import smtplib - from email.MIMEText import MIMEText - msg = MIMEText(msgstr) - msg['Subject'] = subject - msg['From'] = from_name - msg['To'] = to_name - - server_str, port, login, pwd = _get_credentials() - server = smtplib.SMTP(server_str, port) - server.ehlo() - server.starttls() - server.ehlo() - - server.login(login, pwd) - try: - server.sendmail(from_name, to_name, msg.as_string()) - finally: - server.close() - - -def _get_dir(subdir=None): - import getpass - USERNAME = getpass.getuser() - if sys.platform == 'darwin': - HOME = '/Users/%s' % USERNAME - else: - HOME = '/home/%s' % USERNAME - - if subdir is None: - subdir = '/code/scripts/config' - conf_dir = '%s/%s' % (HOME, subdir) - return conf_dir - - -def _get_credentials(): - tmp_dir = _get_dir() - cred = '%s/credentials' % tmp_dir - with open(cred, 'r') as fh: - server, port, un, domain = fh.read().split(',') - port = int(port) - login = un + '@' + domain + '.com' - - import base64 - with open('%s/cron_email_pwd' % tmp_dir, 'r') as fh: - pwd = base64.b64decode(fh.read()) - - return server, port, login, pwd - - -def _get_config(): - tmp_dir = _get_dir() - with open('%s/addresses' % tmp_dir, 'r') as fh: - from_name, to_name = fh.read().split(',') - return from_name, to_name - -funcd = { - 'html': html, - 'zip_html': zip_html, - 'upload_dev': upload_dev, - 'upload_stable': upload_stable, - 'upload_dev_pdf': upload_dev_pdf, - 'upload_stable_pdf': upload_stable_pdf, - 'latex': latex, - 'latex_forced': latex_forced, - 'clean': clean, - 'auto_dev': auto_dev_build, - 'auto_debug': lambda: auto_dev_build(True), - 'build_pandas': build_pandas, - 'all': all, -} - -small_docs = False - -# current_dir = os.getcwd() -# os.chdir(os.path.dirname(os.path.join(current_dir, __file__))) - -import argparse -argparser = argparse.ArgumentParser(description=""" -pandas documentation builder -""".strip()) - -# argparser.add_argument('-arg_name', '--arg_name', -# metavar='label for arg help', -# type=str|etc, -# nargs='N|*|?|+|argparse.REMAINDER', -# required=False, -# #choices='abc', -# help='help string', -# action='store|store_true') - -# args = argparser.parse_args() - -#print args.accumulate(args.integers) - -def generate_index(api=True, single=False, **kwds): - from jinja2 import Template - with open("source/index.rst.template") as f: - t = Template(f.read()) - - with open("source/index.rst","w") as f: - f.write(t.render(api=api,single=single,**kwds)) - -import argparse -argparser = argparse.ArgumentParser(description="pandas documentation builder", - epilog="Targets : %s" % funcd.keys()) - -argparser.add_argument('--no-api', - default=False, - help='Ommit api and autosummary', - action='store_true') -argparser.add_argument('--single', - 
metavar='FILENAME',
-                       type=str,
-                       default=False,
-                       help='filename of section to compile, e.g. "indexing"')
-argparser.add_argument('--user',
-                       type=str,
-                       default=False,
-                       help='Username to connect to the pydata server')

 def main():
-    args, unknown = argparser.parse_known_args()
-    sys.argv = [sys.argv[0]] + unknown
-    if args.single:
-        args.single = os.path.basename(args.single).split(".rst")[0]
-
-    if 'clean' in unknown:
-        args.single=False
-
-    generate_index(api=not args.no_api and not args.single, single=args.single)
-
-    if len(sys.argv) > 2:
-        ftype = sys.argv[1]
-        ver = sys.argv[2]
-
-        if ftype == 'build_previous':
-            build_prev(ver, user=args.user)
-        if ftype == 'upload_previous':
-            upload_prev(ver, user=args.user)
-    elif len(sys.argv) == 2:
-        for arg in sys.argv[1:]:
-            func = funcd.get(arg)
-            if func is None:
-                raise SystemExit('Do not know how to handle %s; valid args are %s' % (
-                    arg, list(funcd.keys())))
-            if args.user:
-                func(user=args.user)
-            else:
-                func()
-    else:
-        small_docs = False
-        all()
-# os.chdir(current_dir)
+    cmds = [method for method in dir(DocBuilder) if not method.startswith('_')]
+
+    argparser = argparse.ArgumentParser(
+        description='pandas documentation builder',
+        epilog='Commands: {}'.format(','.join(cmds)))
+    argparser.add_argument('command',
+                           nargs='?',
+                           default='html',
+                           help='command to run: {}'.format(', '.join(cmds)))
+    argparser.add_argument('--num-jobs',
+                           type=int,
+                           default=1,
+                           help='number of jobs used by sphinx-build')
+    argparser.add_argument('--no-api',
+                           default=False,
+                           help='omit api and autosummary',
+                           action='store_true')
+    argparser.add_argument('--single',
+                           metavar='FILENAME',
+                           type=str,
+                           default=None,
+                           help=('filename of section or method name to '
+                                 'compile, e.g. "indexing", "DataFrame.join"'))
+    argparser.add_argument('--python-path',
+                           type=str,
+                           default=os.path.dirname(DOC_PATH),
+                           help='path')
+    argparser.add_argument('-v', action='count', dest='verbosity', default=0,
+                           help=('increase verbosity (can be repeated), '
+                                 'passed to the sphinx build command'))
+    args = argparser.parse_args()
+
+    if args.command not in cmds:
+        raise ValueError('Unknown command {}. Available options: {}'.format(
+            args.command, ', '.join(cmds)))
+
+    # Below we update both os.environ and sys.path. The former is used by
+    # external libraries (namely Sphinx) to compile this module and resolve
+    # the import of `python_path` correctly. 
The latter is used to resolve + # the import within the module, injecting it into the global namespace + os.environ['PYTHONPATH'] = args.python_path + sys.path.append(args.python_path) + globals()['pandas'] = importlib.import_module('pandas') + + builder = DocBuilder(args.num_jobs, not args.no_api, args.single, + args.verbosity) + getattr(builder, args.command)() + if __name__ == '__main__': - import sys sys.exit(main()) diff --git a/doc/plots/stats/moment_plots.py b/doc/plots/stats/moment_plots.py deleted file mode 100644 index 9e3a902592c6b..0000000000000 --- a/doc/plots/stats/moment_plots.py +++ /dev/null @@ -1,30 +0,0 @@ -import numpy as np - -import matplotlib.pyplot as plt -import pandas.util.testing as t -import pandas.stats.moments as m - - -def test_series(n=1000): - t.N = n - s = t.makeTimeSeries() - return s - - -def plot_timeseries(*args, **kwds): - n = len(args) - - fig, axes = plt.subplots(n, 1, figsize=kwds.get('size', (10, 5)), - sharex=True) - titles = kwds.get('titles', None) - - for k in range(1, n + 1): - ax = axes[k - 1] - ts = args[k - 1] - ax.plot(ts.index, ts.values) - - if titles: - ax.set_title(titles[k - 1]) - - fig.autofmt_xdate() - fig.subplots_adjust(bottom=0.10, top=0.95) diff --git a/doc/plots/stats/moments_ewma.py b/doc/plots/stats/moments_ewma.py deleted file mode 100644 index 3e521ed60bb8f..0000000000000 --- a/doc/plots/stats/moments_ewma.py +++ /dev/null @@ -1,15 +0,0 @@ -import matplotlib.pyplot as plt -import pandas.util.testing as t -import pandas.stats.moments as m - -t.N = 200 -s = t.makeTimeSeries().cumsum() - -plt.figure(figsize=(10, 5)) -plt.plot(s.index, s.values) -plt.plot(s.index, m.ewma(s, 20, min_periods=1).values) -f = plt.gcf() -f.autofmt_xdate() - -plt.show() -plt.close('all') diff --git a/doc/plots/stats/moments_ewmvol.py b/doc/plots/stats/moments_ewmvol.py deleted file mode 100644 index 093f62868fc4e..0000000000000 --- a/doc/plots/stats/moments_ewmvol.py +++ /dev/null @@ -1,23 +0,0 @@ -import matplotlib.pyplot as plt -import pandas.util.testing as t -import pandas.stats.moments as m - -t.N = 500 -ts = t.makeTimeSeries() -ts[::100] = 20 - -s = ts.cumsum() - - -plt.figure(figsize=(10, 5)) -plt.plot(s.index, m.ewmvol(s, span=50, min_periods=1).values, color='b') -plt.plot(s.index, m.rolling_std(s, 50, min_periods=1).values, color='r') - -plt.title('Exp-weighted std with shocks') -plt.legend(('Exp-weighted', 'Equal-weighted')) - -f = plt.gcf() -f.autofmt_xdate() - -plt.show() -plt.close('all') diff --git a/doc/plots/stats/moments_expw.py b/doc/plots/stats/moments_expw.py deleted file mode 100644 index 5fff419b3a940..0000000000000 --- a/doc/plots/stats/moments_expw.py +++ /dev/null @@ -1,35 +0,0 @@ -from moment_plots import * - -np.random.seed(1) - -ts = test_series(500) * 10 - -# ts[::100] = 20 - -s = ts.cumsum() - -fig, axes = plt.subplots(3, 1, figsize=(8, 10), sharex=True) - -ax0, ax1, ax2 = axes - -ax0.plot(s.index, s.values) -ax0.set_title('time series') - -ax1.plot(s.index, m.ewma(s, span=50, min_periods=1).values, color='b') -ax1.plot(s.index, m.rolling_mean(s, 50, min_periods=1).values, color='r') -ax1.set_title('rolling_mean vs. ewma') - -line1 = ax2.plot( - s.index, m.ewmstd(s, span=50, min_periods=1).values, color='b') -line2 = ax2.plot( - s.index, m.rolling_std(s, 50, min_periods=1).values, color='r') -ax2.set_title('rolling_std vs. 
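The new entry point replaces the old ``funcd`` name-to-function dictionary with attribute dispatch on a ``DocBuilder`` class, and makes the chosen pandas checkout importable both for subprocesses (via ``os.environ['PYTHONPATH']``, which ``sphinx-build`` reads) and for the current process (via ``sys.path``). What follows is a minimal sketch of that pattern, not the patch itself: the ``DocBuilder`` body here is a hypothetical stand-in, and only the dispatch and path-injection logic mirror the code above.

.. code-block:: python

   import argparse
   import os
   import sys


   class DocBuilder(object):
       """Hypothetical stand-in: each public method is one CLI command."""

       def __init__(self, num_jobs=1):
           self.num_jobs = num_jobs

       def html(self):
           print('building html with {} job(s)'.format(self.num_jobs))

       def latex(self):
           print('building latex')


   def main():
       # Public methods of DocBuilder double as the available commands.
       cmds = [m for m in dir(DocBuilder) if not m.startswith('_')]

       parser = argparse.ArgumentParser(description='doc builder sketch')
       parser.add_argument('command', nargs='?', default='html',
                           help='command to run: {}'.format(', '.join(cmds)))
       parser.add_argument('--num-jobs', type=int, default=1)
       parser.add_argument('--python-path', default=os.getcwd())
       args = parser.parse_args()

       if args.command not in cmds:
           raise ValueError('Unknown command {}'.format(args.command))

       # Visible to subprocesses (e.g. sphinx-build) via the environment,
       # and to this process via sys.path.
       os.environ['PYTHONPATH'] = args.python_path
       sys.path.append(args.python_path)

       # Attribute lookup replaces the old name -> function dictionary.
       getattr(DocBuilder(args.num_jobs), args.command)()


   if __name__ == '__main__':
       sys.exit(main())

Invoked as, e.g., ``python make.py html --num-jobs 4``; because the command is validated against ``dir(DocBuilder)``, adding a new build step amounts to adding one public method.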
diff --git a/doc/plots/stats/moment_plots.py b/doc/plots/stats/moment_plots.py
deleted file mode 100644
index 9e3a902592c6b..0000000000000
--- a/doc/plots/stats/moment_plots.py
+++ /dev/null
@@ -1,30 +0,0 @@
-import numpy as np
-
-import matplotlib.pyplot as plt
-import pandas.util.testing as t
-import pandas.stats.moments as m
-
-
-def test_series(n=1000):
-    t.N = n
-    s = t.makeTimeSeries()
-    return s
-
-
-def plot_timeseries(*args, **kwds):
-    n = len(args)
-
-    fig, axes = plt.subplots(n, 1, figsize=kwds.get('size', (10, 5)),
-                             sharex=True)
-    titles = kwds.get('titles', None)
-
-    for k in range(1, n + 1):
-        ax = axes[k - 1]
-        ts = args[k - 1]
-        ax.plot(ts.index, ts.values)
-
-        if titles:
-            ax.set_title(titles[k - 1])
-
-    fig.autofmt_xdate()
-    fig.subplots_adjust(bottom=0.10, top=0.95)
diff --git a/doc/plots/stats/moments_ewma.py b/doc/plots/stats/moments_ewma.py
deleted file mode 100644
index 3e521ed60bb8f..0000000000000
--- a/doc/plots/stats/moments_ewma.py
+++ /dev/null
@@ -1,15 +0,0 @@
-import matplotlib.pyplot as plt
-import pandas.util.testing as t
-import pandas.stats.moments as m
-
-t.N = 200
-s = t.makeTimeSeries().cumsum()
-
-plt.figure(figsize=(10, 5))
-plt.plot(s.index, s.values)
-plt.plot(s.index, m.ewma(s, 20, min_periods=1).values)
-f = plt.gcf()
-f.autofmt_xdate()
-
-plt.show()
-plt.close('all')
diff --git a/doc/plots/stats/moments_ewmvol.py b/doc/plots/stats/moments_ewmvol.py
deleted file mode 100644
index 093f62868fc4e..0000000000000
--- a/doc/plots/stats/moments_ewmvol.py
+++ /dev/null
@@ -1,23 +0,0 @@
-import matplotlib.pyplot as plt
-import pandas.util.testing as t
-import pandas.stats.moments as m
-
-t.N = 500
-ts = t.makeTimeSeries()
-ts[::100] = 20
-
-s = ts.cumsum()
-
-
-plt.figure(figsize=(10, 5))
-plt.plot(s.index, m.ewmvol(s, span=50, min_periods=1).values, color='b')
-plt.plot(s.index, m.rolling_std(s, 50, min_periods=1).values, color='r')
-
-plt.title('Exp-weighted std with shocks')
-plt.legend(('Exp-weighted', 'Equal-weighted'))
-
-f = plt.gcf()
-f.autofmt_xdate()
-
-plt.show()
-plt.close('all')
diff --git a/doc/plots/stats/moments_expw.py b/doc/plots/stats/moments_expw.py
deleted file mode 100644
index 5fff419b3a940..0000000000000
--- a/doc/plots/stats/moments_expw.py
+++ /dev/null
@@ -1,35 +0,0 @@
-from moment_plots import *
-
-np.random.seed(1)
-
-ts = test_series(500) * 10
-
-# ts[::100] = 20
-
-s = ts.cumsum()
-
-fig, axes = plt.subplots(3, 1, figsize=(8, 10), sharex=True)
-
-ax0, ax1, ax2 = axes
-
-ax0.plot(s.index, s.values)
-ax0.set_title('time series')
-
-ax1.plot(s.index, m.ewma(s, span=50, min_periods=1).values, color='b')
-ax1.plot(s.index, m.rolling_mean(s, 50, min_periods=1).values, color='r')
-ax1.set_title('rolling_mean vs. ewma')
-
-line1 = ax2.plot(
-    s.index, m.ewmstd(s, span=50, min_periods=1).values, color='b')
-line2 = ax2.plot(
-    s.index, m.rolling_std(s, 50, min_periods=1).values, color='r')
-ax2.set_title('rolling_std vs. ewmstd')
-
-fig.legend((line1, line2),
-           ('Exp-weighted', 'Equal-weighted'),
-           loc='upper right')
-fig.autofmt_xdate()
-fig.subplots_adjust(bottom=0.10, top=0.95)
-
-plt.show()
-plt.close('all')
diff --git a/doc/plots/stats/moments_rolling.py b/doc/plots/stats/moments_rolling.py
deleted file mode 100644
index 30a6c5f53e20c..0000000000000
--- a/doc/plots/stats/moments_rolling.py
+++ /dev/null
@@ -1,24 +0,0 @@
-from moment_plots import *
-
-ts = test_series()
-s = ts.cumsum()
-
-s[20:50] = np.NaN
-s[120:150] = np.NaN
-plot_timeseries(s,
-                m.rolling_count(s, 50),
-                m.rolling_sum(s, 50, min_periods=10),
-                m.rolling_mean(s, 50, min_periods=10),
-                m.rolling_std(s, 50, min_periods=10),
-                m.rolling_skew(s, 50, min_periods=10),
-                m.rolling_kurt(s, 50, min_periods=10),
-                size=(10, 12),
-                titles=('time series',
-                        'rolling_count',
-                        'rolling_sum',
-                        'rolling_mean',
-                        'rolling_std',
-                        'rolling_skew',
-                        'rolling_kurt'))
-plt.show()
-plt.close('all')
diff --git a/doc/plots/stats/moments_rolling_binary.py b/doc/plots/stats/moments_rolling_binary.py
deleted file mode 100644
index ab6b7b1c8ff49..0000000000000
--- a/doc/plots/stats/moments_rolling_binary.py
+++ /dev/null
@@ -1,30 +0,0 @@
-from moment_plots import *
-
-np.random.seed(1)
-
-ts = test_series()
-s = ts.cumsum()
-ts2 = test_series()
-s2 = ts2.cumsum()
-
-s[20:50] = np.NaN
-s[120:150] = np.NaN
-fig, axes = plt.subplots(3, 1, figsize=(8, 10), sharex=True)
-
-ax0, ax1, ax2 = axes
-
-ax0.plot(s.index, s.values)
-ax0.plot(s2.index, s2.values)
-ax0.set_title('time series')
-
-ax1.plot(s.index, m.rolling_corr(s, s2, 50, min_periods=1).values)
-ax1.set_title('rolling_corr')
-
-ax2.plot(s.index, m.rolling_cov(s, s2, 50, min_periods=1).values)
-ax2.set_title('rolling_cov')
-
-fig.autofmt_xdate()
-fig.subplots_adjust(bottom=0.10, top=0.95)
-
-plt.show()
-plt.close('all')
diff --git a/doc/source/10min.rst b/doc/source/10min.rst
index 3cf05698dd9d0..fbbe94a72c71e 100644
--- a/doc/source/10min.rst
+++ b/doc/source/10min.rst
@@ -11,10 +11,7 @@
    np.random.seed(123456)
    np.set_printoptions(precision=4, suppress=True)
    import matplotlib
-   try:
-       matplotlib.style.use('ggplot')
-   except AttributeError:
-       pd.options.display.mpl_style = 'default'
+   # matplotlib.style.use('default')
    pd.options.display.max_rows = 15
 
 #### portions of this were borrowed from the
@@ -28,7 +25,7 @@
 ********************
 
 This is a short introduction to pandas, geared mainly for new users.
-You can see more complex recipes in the :ref:`Cookbook`
+You can see more complex recipes in the :ref:`Cookbook`.
 
 Customarily, we import as follows:
@@ -41,7 +38,7 @@ Customarily, we import as follows:
 Object Creation
 ---------------
 
-See the :ref:`Data Structure Intro section `
+See the :ref:`Data Structure Intro section `.
 
 Creating a :class:`Series` by passing a list of values, letting pandas create
 a default integer index:
@@ -51,7 +48,7 @@ a default integer index:
 
    s = pd.Series([1,3,5,np.nan,6,8])
   s
 
-Creating a :class:`DataFrame` by passing a numpy array, with a datetime index
+Creating a :class:`DataFrame` by passing a NumPy array, with a datetime index
 and labeled columns:
 
 .. ipython:: python
@@ -73,7 +70,8 @@ Creating a ``DataFrame`` by passing a dict of objects that can be converted to s
                        'F' : 'foo' })
    df2
 
-Having specific :ref:`dtypes `
+The columns of the resulting ``DataFrame`` have different
+:ref:`dtypes `.
 
 .. ipython:: python
@@ -87,29 +85,18 @@ will be completed:
 
    @verbatim
    In [1]: df2.
-   df2.A                  df2.boxplot
-   df2.abs                df2.C
-   df2.add                df2.clip
-   df2.add_prefix         df2.clip_lower
-   df2.add_suffix         df2.clip_upper
-   df2.align              df2.columns
-   df2.all                df2.combine
-   df2.any                df2.combineAdd
+   df2.A                  df2.bool
+   df2.abs                df2.boxplot
+   df2.add                df2.C
+   df2.add_prefix         df2.clip
+   df2.add_suffix         df2.clip_lower
+   df2.align              df2.clip_upper
+   df2.all                df2.columns
+   df2.any                df2.combine
    df2.append             df2.combine_first
-   df2.apply              df2.combineMult
-   df2.applymap           df2.compound
-   df2.as_blocks          df2.consolidate
-   df2.asfreq             df2.convert_objects
-   df2.as_matrix          df2.copy
-   df2.astype             df2.corr
-   df2.at                 df2.corrwith
-   df2.at_time            df2.count
-   df2.axes               df2.cov
-   df2.B                  df2.cummax
-   df2.between_time       df2.cummin
-   df2.bfill              df2.cumprod
-   df2.blocks             df2.cumsum
-   df2.bool               df2.D
+   df2.apply              df2.compound
+   df2.applymap           df2.consolidate
+   df2.D
 
 As you can see, the columns ``A``, ``B``, ``C``, and ``D`` are automatically
 tab completed. ``E`` is there as well; the rest of the attributes have been
 truncated for brevity.
@@ -118,16 +105,16 @@ truncated for brevity.
 Viewing Data
 ------------
 
-See the :ref:`Basics section `
+See the :ref:`Basics section `.
 
-See the top & bottom rows of the frame
+Here is how to view the top and bottom rows of the frame:
 
 .. ipython:: python
 
    df.head()
   df.tail(3)
 
-Display the index, columns, and the underlying numpy data
+Display the index, columns, and the underlying NumPy data:
 
 .. ipython:: python
@@ -135,25 +122,25 @@ Display the index, columns, and the underlying numpy data
 
    df.index
    df.columns
   df.values
 
-Describe shows a quick statistic summary of your data
+:func:`~DataFrame.describe` shows a quick statistic summary of your data:
 
 .. ipython:: python
 
    df.describe()
 
-Transposing your data
+Transposing your data:
 
 .. ipython:: python
 
   df.T
 
-Sorting by an axis
+Sorting by an axis:
 
 .. ipython:: python
 
   df.sort_index(axis=1, ascending=False)
 
-Sorting by values
+Sorting by values:
 
 .. ipython:: python
@@ -167,15 +154,15 @@ Selection
 
    While standard Python / Numpy expressions for selecting and setting are
    intuitive and come in handy for interactive work, for production code, we
   recommend the optimized pandas data access methods, ``.at``, ``.iat``,
-   ``.loc``, ``.iloc`` and ``.ix``.
+   ``.loc`` and ``.iloc``.
 
-See the indexing documentation :ref:`Indexing and Selecting Data ` and :ref:`MultiIndex / Advanced Indexing `
+See the indexing documentation :ref:`Indexing and Selecting Data ` and :ref:`MultiIndex / Advanced Indexing `.
 
 Getting
 ~~~~~~~
 
 Selecting a single column, which yields a ``Series``,
-equivalent to ``df.A``
+equivalent to ``df.A``:
 
 .. ipython:: python
@@ -191,39 +178,39 @@ Selecting via ``[]``, which slices the rows.
 
 Selection by Label
 ~~~~~~~~~~~~~~~~~~
 
-See more in :ref:`Selection by Label `
+See more in :ref:`Selection by Label `.
 
-For getting a cross section using a label
+For getting a cross section using a label:
 
 .. ipython:: python
 
   df.loc[dates[0]]
 
-Selecting on a multi-axis by label
+Selecting on a multi-axis by label:
 
 .. ipython:: python
 
   df.loc[:,['A','B']]
 
-Showing label slicing, both endpoints are *included*
+Showing label slicing, both endpoints are *included*:
 
 .. ipython:: python
 
   df.loc['20130102':'20130104',['A','B']]
 
-Reduction in the dimensions of the returned object
+Reduction in the dimensions of the returned object:
 
 .. ipython:: python
 
   df.loc['20130102',['A','B']]
 
-For getting a scalar value
+For getting a scalar value:
 
 .. ipython:: python
 
   df.loc[dates[0],'A']
 
-For getting fast access to a scalar (equiv to the prior method)
+For getting fast access to a scalar (equivalent to the prior method):
 
 .. ipython:: python
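The Selection note above drops ``.ix`` from the recommended accessors. ``.ix`` had to guess between label-based and position-based lookup, which is precisely the ambiguity that ``.loc`` and ``.iloc`` split apart. A small illustrative example (mine, not part of the patch) using an integer index on which the two interpretations disagree:

.. code-block:: python

   import numpy as np
   import pandas as pd

   df = pd.DataFrame(np.arange(9).reshape(3, 3),
                     index=[2, 0, 1], columns=list('ABC'))

   df.loc[0, 'A']    # label-based: the row *labelled* 0 -> 3
   df.iloc[0, 0]     # position-based: the row *at position* 0 -> 0

   # .at/.iat are the fast scalar versions of the same two lookups.
   df.at[0, 'A']     # -> 3
   df.iat[0, 0]      # -> 0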
@@ -232,45 +219,45 @@ For getting fast access to a scalar (equiv to the prior method)
 Selection by Position
 ~~~~~~~~~~~~~~~~~~~~~
 
-See more in :ref:`Selection by Position `
+See more in :ref:`Selection by Position `.
 
-Select via the position of the passed integers
+Select via the position of the passed integers:
 
 .. ipython:: python
 
   df.iloc[3]
 
-By integer slices, acting similar to numpy/python
+By integer slices, acting similar to numpy/python:
 
 .. ipython:: python
 
   df.iloc[3:5,0:2]
 
-By lists of integer position locations, similar to the numpy/python style
+By lists of integer position locations, similar to the numpy/python style:
 
 .. ipython:: python
 
   df.iloc[[1,2,4],[0,2]]
 
-For slicing rows explicitly
+For slicing rows explicitly:
 
 .. ipython:: python
 
   df.iloc[1:3,:]
 
-For slicing columns explicitly
+For slicing columns explicitly:
 
 .. ipython:: python
 
   df.iloc[:,1:3]
 
-For getting a value explicitly
+For getting a value explicitly:
 
 .. ipython:: python
 
   df.iloc[1,1]
 
-For getting fast access to a scalar (equiv to the prior method)
+For getting fast access to a scalar (equivalent to the prior method):
 
 .. ipython:: python
@@ -285,7 +272,7 @@ Using a single column's values to select data.
 
   df[df.A > 0]
 
-A ``where`` operation for getting.
+Selecting values from a DataFrame where a boolean condition is met.
 
 .. ipython:: python
@@ -304,7 +291,7 @@ Setting
 ~~~~~~~
 
 Setting a new column automatically aligns the data
-by the indexes
+by the indexes.
 
 .. ipython:: python
@@ -312,25 +299,25 @@ by the indexes
 
   s1
   df['F'] = s1
 
-Setting values by label
+Setting values by label:
 
 .. ipython:: python
 
   df.at[dates[0],'A'] = 0
 
-Setting values by position
+Setting values by position:
 
 .. ipython:: python
 
   df.iat[0,1] = 0
 
-Setting by assigning with a numpy array
+Setting by assigning with a NumPy array:
 
 .. ipython:: python
 
   df.loc[:,'D'] = np.array([5] * len(df))
 
-The result of the prior setting operations
+The result of the prior setting operations.
 
 .. ipython:: python
@@ -350,7 +337,7 @@ Missing Data
 
 pandas primarily uses the value ``np.nan`` to represent missing data. It is by
 default not included in computations. See the :ref:`Missing Data section
-`
+`.
 
 Reindexing allows you to change/add/delete the index on a
 specified axis. This returns a copy of the data.
@@ -367,36 +354,36 @@ To drop any rows that have missing data.
 
   df1.dropna(how='any')
 
-Filling missing data
+Filling missing data.
 
 .. ipython:: python
 
  df1.fillna(value=5)
 
-To get the boolean mask where values are ``nan``
+To get the boolean mask where values are ``nan``.
 
 .. ipython:: python
 
-   pd.isnull(df1)
+   pd.isna(df1)
 
 
 Operations
 ----------
 
-See the :ref:`Basic section on Binary Ops `
+See the :ref:`Basic section on Binary Ops `.
 
 Stats
 ~~~~~
 
 Operations in general *exclude* missing data.
 
-Performing a descriptive statistic
+Performing a descriptive statistic:
 
 .. ipython:: python
 
  df.mean()
 
-Same operation on the other axis
+Same operation on the other axis:
 
 .. ipython:: python
@@ -415,7 +402,7 @@ In addition, pandas automatically broadcasts along the specified dimension.
 Apply
 ~~~~~
 
-Applying functions to the data
+Applying functions to the data:
 
 .. ipython:: python
@@ -425,7 +412,7 @@ Applying functions to the data
 Histogramming
 ~~~~~~~~~~~~~
 
-See more at :ref:`Histogramming and Discretization `
+See more at :ref:`Histogramming and Discretization `.
 
 .. ipython:: python
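The ``pd.isnull`` to ``pd.isna`` change above is a rename rather than a behavior change: in pandas 0.21 and later the two functions are aliases, with ``isna``/``notna`` matching the ``DataFrame.isna`` method names. A short sketch (mine) of the boolean mask in use:

.. code-block:: python

   import numpy as np
   import pandas as pd

   df1 = pd.DataFrame({'A': [1.0, np.nan], 'B': [np.nan, 2.0]})

   mask = pd.isna(df1)   # same result as the older pd.isnull(df1)
   mask
   mask.sum()            # count of missing values per column
   df1.fillna(value=5)   # the mask's True cells are the ones filled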
@@ -439,7 +426,7 @@ String Methods
 Series is equipped with a set of string processing methods in the `str`
 attribute that make it easy to operate on each element of the array, as in the
 code snippet below. Note that pattern-matching in `str` generally uses `regular
-expressions `__ by default (and in
+expressions `__ by default (and in
 some cases always uses them). See more at :ref:`Vectorized String Methods
 `.
@@ -459,7 +446,7 @@ DataFrame, and Panel objects with various kinds of set logic for the indexes
 and relational algebra functionality in the case of join / merge-type
 operations.
 
-See the :ref:`Merging section `
+See the :ref:`Merging section `.
 
 Concatenating pandas objects together with :func:`concat`:
@@ -476,7 +463,7 @@ Concatenating pandas objects together with :func:`concat`:
 Join
 ~~~~
 
-SQL style merges. See the :ref:`Database style joining `
+SQL style merges. See the :ref:`Database style joining ` section.
 
 .. ipython:: python
@@ -486,10 +473,22 @@ SQL style merges. See the :ref:`Database style joining `
   right
   pd.merge(left, right, on='key')
 
+Another example that can be given is:
+
+.. ipython:: python
+
+   left = pd.DataFrame({'key': ['foo', 'bar'], 'lval': [1, 2]})
+   right = pd.DataFrame({'key': ['foo', 'bar'], 'rval': [4, 5]})
+   left
+   right
+   pd.merge(left, right, on='key')
+
+
 Append
 ~~~~~~
 
-Append rows to a dataframe. See the :ref:`Appending `
+Append rows to a dataframe. See the :ref:`Appending `
+section.
 
 .. ipython:: python
@@ -503,13 +502,13 @@ Grouping
 --------
 
 By "group by" we are referring to a process involving one or more of the
-following steps
+following steps:
 
  - **Splitting** the data into groups based on some criteria
  - **Applying** a function to each group independently
  - **Combining** the results into a data structure
 
-See the :ref:`Grouping section `
+See the :ref:`Grouping section `.
 
 .. ipython:: python
@@ -521,14 +520,15 @@ See the :ref:`Grouping section `
                      'D' : np.random.randn(8)})
   df
 
-Grouping and then applying a function ``sum`` to the resulting groups.
+Grouping and then applying the :meth:`~DataFrame.sum` function to the resulting
+groups.
 
 .. ipython:: python
 
  df.groupby('A').sum()
 
-Grouping by multiple columns forms a hierarchical index, which we then apply
-the function.
+Grouping by multiple columns forms a hierarchical index, and again we can
+apply the ``sum`` function.
 
 .. ipython:: python
@@ -598,15 +598,15 @@ Time Series
 
 pandas has simple, powerful, and efficient functionality for performing
 resampling operations during frequency conversion (e.g., converting secondly
 data into 5-minutely data). This is extremely common in, but not limited to,
-financial applications. See the :ref:`Time Series section `
+financial applications. See the :ref:`Time Series section `.
 
 .. ipython:: python
 
   rng = pd.date_range('1/1/2012', periods=100, freq='S')
   ts = pd.Series(np.random.randint(0, 500, len(rng)), index=rng)
-   ts.resample('5Min', how='sum')
+   ts.resample('5Min').sum()
 
-Time zone representation
+Time zone representation:
 
 .. ipython:: python
@@ -616,13 +616,13 @@ Time zone representation
 
   ts_utc = ts.tz_localize('UTC')
   ts_utc
 
-Convert to another time zone
+Converting to another time zone:
 
 .. ipython:: python
 
  ts_utc.tz_convert('US/Eastern')
 
-Converting between time span representations
+Converting between time span representations:
 
 .. ipython:: python
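The resample hunk above tracks an API change: the ``how='sum'`` keyword was removed in favor of a deferred ``Resampler`` object whose aggregation is chosen by method chaining. A sketch (mine) of the new spelling:

.. code-block:: python

   import numpy as np
   import pandas as pd

   rng = pd.date_range('1/1/2012', periods=100, freq='S')
   ts = pd.Series(np.random.randint(0, 500, len(rng)), index=rng)

   # .resample(...) alone does no work; it returns a Resampler, and the
   # chained method picks the aggregation (the old how= argument).
   resampler = ts.resample('5Min')
   resampler.sum()    # equivalent to the removed ts.resample('5Min', how='sum')
   resampler.mean()   # one grouping, any number of aggregations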
@@ -648,7 +648,7 @@ the quarter end:
 Categoricals
 ------------
 
-Since version 0.15, pandas can include categorical data in a ``DataFrame``. For full docs, see the
+pandas can include categorical data in a ``DataFrame``. For full docs, see the
 :ref:`categorical introduction ` and the :ref:`API documentation `.
 
 .. ipython:: python
@@ -662,14 +662,15 @@ Convert the raw grades to a categorical data type.
 
   df["grade"] = df["raw_grade"].astype("category")
   df["grade"]
 
-Rename the categories to more meaningful names (assigning to ``Series.cat.categories`` is inplace!)
+Rename the categories to more meaningful names (assigning to
+``Series.cat.categories`` is inplace!).
 
 .. ipython:: python
 
  df["grade"].cat.categories = ["very good", "good", "very bad"]
 
 Reorder the categories and simultaneously add the missing categories (methods under ``Series
-.cat`` return a new ``Series`` per default).
+.cat`` return a new ``Series`` by default).
 
 .. ipython:: python
@@ -682,7 +683,7 @@ Sorting is per order in the categories, not lexical order.
 
  df.sort_values(by="grade")
 
-Grouping by a categorical column shows also empty categories.
+Grouping by a categorical column also shows empty categories.
 
 .. ipython:: python
@@ -692,7 +693,7 @@ Grouping by a categorical column shows also empty categories.
 Plotting
 --------
 
-:ref:`Plotting ` docs.
+See the :ref:`Plotting ` docs.
 
 .. ipython:: python
    :suppress:
@@ -708,8 +709,8 @@ Plotting
 
   @savefig series_plot_basic.png
   ts.plot()
 
-On DataFrame, :meth:`~DataFrame.plot` is a convenience to plot all of the
-columns with labels:
+On a DataFrame, the :meth:`~DataFrame.plot` method is a convenience to plot all
+of the columns with labels:
 
 .. ipython:: python
@@ -726,13 +727,13 @@ Getting Data In/Out
 CSV
 ~~~
 
-:ref:`Writing to a csv file `
+:ref:`Writing to a csv file. `
 
 .. ipython:: python
 
  df.to_csv('foo.csv')
 
-:ref:`Reading from a csv file `
+:ref:`Reading from a csv file. `
 
 .. ipython:: python
@@ -746,15 +747,15 @@ CSV
 HDF5
 ~~~~
 
-Reading and writing to :ref:`HDFStores `
+Reading and writing to :ref:`HDFStores `.
 
-Writing to a HDF5 Store
+Writing to a HDF5 Store.
 
 .. ipython:: python
 
  df.to_hdf('foo.h5','df')
 
-Reading from a HDF5 Store
+Reading from a HDF5 Store.
 
 .. ipython:: python
@@ -768,15 +769,15 @@ Reading from a HDF5 Store
 Excel
 ~~~~~
 
-Reading and writing to :ref:`MS Excel `
+Reading and writing to :ref:`MS Excel `.
 
-Writing to an excel file
+Writing to an excel file.
 
 .. ipython:: python
 
  df.to_excel('foo.xlsx', sheet_name='Sheet1')
 
-Reading from an excel file
+Reading from an excel file.
 
 .. ipython:: python
@@ -790,7 +791,7 @@ Reading from an excel file
 Gotchas
 -------
 
-If you are trying an operation and you see an exception like:
+If you are attempting to perform an operation, you might see an exception like:
 
 .. code-block:: python
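The Gotchas hunk rewords only the sentence introducing the exception, and the excerpt truncates before the exception text itself. For reference, a sketch (mine) of the error this section is about, together with the idiomatic alternatives:

.. code-block:: python

   import pandas as pd

   s = pd.Series([True, False, True])

   try:
       if s:              # ambiguous: all of them? any of them? non-empty?
           pass
   except ValueError as exc:
       print(exc)         # "The truth value of a Series is ambiguous. ..."

   s.any()      # True if at least one element is True
   s.all()      # True only if every element is True
   s.empty      # True if the Series has no elements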
diff --git a/doc/source/_static/banklist.html b/doc/source/_static/banklist.html
index 8ec1561f8c394..cbcce5a2d49ff 100644
--- a/doc/source/_static/banklist.html
+++ b/doc/source/_static/banklist.html
@@ -7,7 +7,7 @@
-
+
@@ -4849,7 +4849,7 @@
 
 Failed Bank List